pydantic-ai-slim 0.0.13__py3-none-any.whl → 0.0.14__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
This version of pydantic-ai-slim has been flagged as a potentially problematic release.
- pydantic_ai/__init__.py +12 -2
- pydantic_ai/_result.py +4 -7
- pydantic_ai/_system_prompt.py +2 -2
- pydantic_ai/agent.py +85 -75
- pydantic_ai/exceptions.py +20 -2
- pydantic_ai/messages.py +29 -7
- pydantic_ai/models/__init__.py +10 -9
- pydantic_ai/models/anthropic.py +12 -12
- pydantic_ai/models/function.py +16 -22
- pydantic_ai/models/gemini.py +16 -18
- pydantic_ai/models/groq.py +21 -23
- pydantic_ai/models/mistral.py +24 -36
- pydantic_ai/models/openai.py +21 -23
- pydantic_ai/models/test.py +23 -17
- pydantic_ai/result.py +63 -33
- pydantic_ai/settings.py +65 -0
- pydantic_ai/tools.py +24 -14
- {pydantic_ai_slim-0.0.13.dist-info → pydantic_ai_slim-0.0.14.dist-info}/METADATA +1 -1
- pydantic_ai_slim-0.0.14.dist-info/RECORD +26 -0
- pydantic_ai_slim-0.0.13.dist-info/RECORD +0 -26
- {pydantic_ai_slim-0.0.13.dist-info → pydantic_ai_slim-0.0.14.dist-info}/WHEEL +0 -0
pydantic_ai/__init__.py
CHANGED
@@ -1,8 +1,18 @@
 from importlib.metadata import version
 
 from .agent import Agent
-from .exceptions import ModelRetry, UnexpectedModelBehavior, UserError
+from .exceptions import AgentRunError, ModelRetry, UnexpectedModelBehavior, UsageLimitExceeded, UserError
 from .tools import RunContext, Tool
 
-__all__ =
+__all__ = (
+    'Agent',
+    'RunContext',
+    'Tool',
+    'AgentRunError',
+    'ModelRetry',
+    'UnexpectedModelBehavior',
+    'UsageLimitExceeded',
+    'UserError',
+    '__version__',
+)
 __version__ = version('pydantic_ai_slim')
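The package root now defines an explicit `__all__`, so everything in it can be imported directly from `pydantic_ai`. A minimal sketch of the two newly exported names (the assertion is illustrative, not part of the diff):

    from pydantic_ai import Agent, AgentRunError, ModelRetry, RunContext, Tool, UsageLimitExceeded

    # AgentRunError and UsageLimitExceeded are new in 0.0.14; both are defined
    # in pydantic_ai.exceptions (see that file's diff below)
    assert issubclass(UsageLimitExceeded, AgentRunError)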
pydantic_ai/_result.py
CHANGED
@@ -29,25 +29,22 @@ class ResultValidator(Generic[AgentDeps, ResultData]):
     async def validate(
         self,
         result: ResultData,
-        deps: AgentDeps,
-        retry: int,
         tool_call: _messages.ToolCallPart | None,
-
+        run_context: RunContext[AgentDeps],
     ) -> ResultData:
         """Validate a result but calling the function.
 
         Args:
             result: The result data after Pydantic validation the message content.
-            deps: The agent dependencies.
-            retry: The current retry number.
             tool_call: The original tool call message, `None` if there was no tool call.
-
+            run_context: The current run context.
 
         Returns:
             Result of either the validated result data (ok) or a retry message (Err).
         """
         if self._takes_ctx:
-
+            ctx = run_context.replace_with(tool_name=tool_call.tool_name if tool_call else None)
+            args = ctx, result
         else:
             args = (result,)
 
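For orientation, a hedged sketch of a result validator written against the new signature: the validator function now receives the whole `RunContext` instead of separate `deps`/`retry` arguments. The agent setup and names here are illustrative, not taken from the diff:

    from pydantic_ai import Agent, ModelRetry, RunContext

    agent = Agent('test', deps_type=str)

    @agent.result_validator
    async def check_result(ctx: RunContext[str], value: str) -> str:
        # ctx bundles deps, retry count, messages and model in one object
        if ctx.deps not in value:
            raise ModelRetry('result must mention the deps string')
        return value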
pydantic_ai/_system_prompt.py
CHANGED
@@ -19,9 +19,9 @@ class SystemPromptRunner(Generic[AgentDeps]):
         self._takes_ctx = len(inspect.signature(self.function).parameters) > 0
         self._is_async = inspect.iscoroutinefunction(self.function)
 
-    async def run(self,
+    async def run(self, run_context: RunContext[AgentDeps]) -> str:
         if self._takes_ctx:
-            args = (
+            args = (run_context,)
         else:
             args = ()
 
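The user-facing counterpart: a system prompt function that accepts the run context, which the runner now passes in place of bare deps. A minimal sketch (agent setup illustrative):

    from pydantic_ai import Agent, RunContext

    agent = Agent('test', deps_type=str)

    @agent.system_prompt
    async def personalized_prompt(ctx: RunContext[str]) -> str:
        return f'The user you are helping is called {ctx.deps}.'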
pydantic_ai/agent.py
CHANGED
@@ -22,7 +22,7 @@ from . import (
     result,
 )
 from .result import ResultData
-from .settings import ModelSettings, merge_model_settings
+from .settings import ModelSettings, UsageLimits, merge_model_settings
 from .tools import (
     AgentDeps,
     RunContext,
@@ -104,7 +104,6 @@ class Agent(Generic[AgentDeps, ResultData]):
     _system_prompt_functions: list[_system_prompt.SystemPromptRunner[AgentDeps]] = field(repr=False)
     _deps_type: type[AgentDeps] = field(repr=False)
     _max_result_retries: int = field(repr=False)
-    _current_result_retry: int = field(repr=False)
     _override_deps: _utils.Option[AgentDeps] = field(default=None, repr=False)
     _override_model: _utils.Option[models.Model] = field(default=None, repr=False)
@@ -180,7 +179,6 @@ class Agent(Generic[AgentDeps, ResultData]):
         self._deps_type = deps_type
         self._system_prompt_functions = []
         self._max_result_retries = result_retries if result_retries is not None else retries
-        self._current_result_retry = 0
         self._result_validators = []
 
     async def run(
@@ -191,6 +189,7 @@ class Agent(Generic[AgentDeps, ResultData]):
         model: models.Model | models.KnownModelName | None = None,
         deps: AgentDeps = None,
         model_settings: ModelSettings | None = None,
+        usage_limits: UsageLimits | None = None,
         infer_name: bool = True,
     ) -> result.RunResult[ResultData]:
         """Run the agent with a user prompt in async mode.
@@ -211,8 +210,9 @@ class Agent(Generic[AgentDeps, ResultData]):
             message_history: History of the conversation so far.
             model: Optional model to use for this run, required if `model` was not set when creating the agent.
             deps: Optional dependencies to use for this run.
-            infer_name: Whether to try to infer the agent name from the call frame if it's not set.
             model_settings: Optional settings to use for this model's request.
+            usage_limits: Optional limits on model request count or token usage.
+            infer_name: Whether to try to infer the agent name from the call frame if it's not set.
 
         Returns:
             The result of the run.
@@ -232,31 +232,37 @@ class Agent(Generic[AgentDeps, ResultData]):
             model_name=model_used.name(),
             agent_name=self.name or 'agent',
         ) as run_span:
-
+            run_context = RunContext(deps, 0, [], None, model_used)
+            messages = await self._prepare_messages(user_prompt, message_history, run_context)
+            self.last_run_messages = run_context.messages = messages
 
             for tool in self._function_tools.values():
                 tool.current_retry = 0
 
-
-
+            usage = result.Usage(requests=0)
             model_settings = merge_model_settings(self.model_settings, model_settings)
+            usage_limits = usage_limits or UsageLimits()
 
             run_step = 0
             while True:
+                usage_limits.check_before_request(usage)
+
                 run_step += 1
                 with _logfire.span('preparing model and tools {run_step=}', run_step=run_step):
-                    agent_model = await self._prepare_model(
+                    agent_model = await self._prepare_model(run_context)
 
                 with _logfire.span('model request', run_step=run_step) as model_req_span:
-                    model_response,
+                    model_response, request_usage = await agent_model.request(messages, model_settings)
                     model_req_span.set_attribute('response', model_response)
-                    model_req_span.set_attribute('
+                    model_req_span.set_attribute('usage', request_usage)
 
                 messages.append(model_response)
-
+                usage += request_usage
+                usage.requests += 1
+                usage_limits.check_tokens(request_usage)
 
                 with _logfire.span('handle model response', run_step=run_step) as handle_span:
-                    final_result, tool_responses = await self._handle_model_response(model_response,
+                    final_result, tool_responses = await self._handle_model_response(model_response, run_context)
 
                     if tool_responses:
                         # Add parts to the conversation as a new message
@@ -266,10 +272,10 @@ class Agent(Generic[AgentDeps, ResultData]):
                     if final_result is not None:
                         result_data = final_result.data
                         run_span.set_attribute('all_messages', messages)
-                        run_span.set_attribute('
+                        run_span.set_attribute('usage', usage)
                         handle_span.set_attribute('result', result_data)
                         handle_span.message = 'handle model response -> final result'
-                        return result.RunResult(messages, new_message_index, result_data,
+                        return result.RunResult(messages, new_message_index, result_data, usage)
                     else:
                         # continue the conversation
                         handle_span.set_attribute('tool_responses', tool_responses)
@@ -284,6 +290,7 @@ class Agent(Generic[AgentDeps, ResultData]):
         model: models.Model | models.KnownModelName | None = None,
         deps: AgentDeps = None,
         model_settings: ModelSettings | None = None,
+        usage_limits: UsageLimits | None = None,
         infer_name: bool = True,
     ) -> result.RunResult[ResultData]:
         """Run the agent with a user prompt synchronously.
@@ -308,8 +315,9 @@ class Agent(Generic[AgentDeps, ResultData]):
             message_history: History of the conversation so far.
             model: Optional model to use for this run, required if `model` was not set when creating the agent.
             deps: Optional dependencies to use for this run.
-            infer_name: Whether to try to infer the agent name from the call frame if it's not set.
             model_settings: Optional settings to use for this model's request.
+            usage_limits: Optional limits on model request count or token usage.
+            infer_name: Whether to try to infer the agent name from the call frame if it's not set.
 
         Returns:
             The result of the run.
@@ -322,8 +330,9 @@ class Agent(Generic[AgentDeps, ResultData]):
                 message_history=message_history,
                 model=model,
                 deps=deps,
-                infer_name=False,
                 model_settings=model_settings,
+                usage_limits=usage_limits,
+                infer_name=False,
             )
         )
 
@@ -336,6 +345,7 @@ class Agent(Generic[AgentDeps, ResultData]):
         model: models.Model | models.KnownModelName | None = None,
         deps: AgentDeps = None,
         model_settings: ModelSettings | None = None,
+        usage_limits: UsageLimits | None = None,
         infer_name: bool = True,
     ) -> AsyncIterator[result.StreamedRunResult[AgentDeps, ResultData]]:
         """Run the agent with a user prompt in async mode, returning a streamed response.
@@ -357,8 +367,9 @@ class Agent(Generic[AgentDeps, ResultData]):
             message_history: History of the conversation so far.
             model: Optional model to use for this run, required if `model` was not set when creating the agent.
             deps: Optional dependencies to use for this run.
-            infer_name: Whether to try to infer the agent name from the call frame if it's not set.
             model_settings: Optional settings to use for this model's request.
+            usage_limits: Optional limits on model request count or token usage.
+            infer_name: Whether to try to infer the agent name from the call frame if it's not set.
 
         Returns:
             The result of the run.
@@ -380,32 +391,35 @@ class Agent(Generic[AgentDeps, ResultData]):
             model_name=model_used.name(),
             agent_name=self.name or 'agent',
         ) as run_span:
-
+            run_context = RunContext(deps, 0, [], None, model_used)
+            messages = await self._prepare_messages(user_prompt, message_history, run_context)
+            self.last_run_messages = run_context.messages = messages
 
             for tool in self._function_tools.values():
                 tool.current_retry = 0
 
-
+            usage = result.Usage()
             model_settings = merge_model_settings(self.model_settings, model_settings)
+            usage_limits = usage_limits or UsageLimits()
 
             run_step = 0
             while True:
                 run_step += 1
+                usage_limits.check_before_request(usage)
 
                 with _logfire.span('preparing model and tools {run_step=}', run_step=run_step):
-                    agent_model = await self._prepare_model(
+                    agent_model = await self._prepare_model(run_context)
 
                 with _logfire.span('model request {run_step=}', run_step=run_step) as model_req_span:
                     async with agent_model.request_stream(messages, model_settings) as model_response:
+                        usage.requests += 1
                         model_req_span.set_attribute('response_type', model_response.__class__.__name__)
                         # We want to end the "model request" span here, but we can't exit the context manager
                         # in the traditional way
                         model_req_span.__exit__(None, None, None)
 
                         with _logfire.span('handle model response') as handle_span:
-                            maybe_final_result = await self._handle_streamed_model_response(
-                                model_response, deps, messages
-                            )
+                            maybe_final_result = await self._handle_streamed_model_response(model_response, run_context)
 
                             # Check if we got a final result
                             if isinstance(maybe_final_result, _MarkFinalResult):
@@ -425,7 +439,7 @@ class Agent(Generic[AgentDeps, ResultData]):
                                     part for part in last_message.parts if isinstance(part, _messages.ToolCallPart)
                                 ]
                                 parts = await self._process_function_tools(
-                                    tool_calls, result_tool_name,
+                                    tool_calls, result_tool_name, run_context
                                 )
                                 if parts:
                                     messages.append(_messages.ModelRequest(parts))
@@ -434,10 +448,11 @@ class Agent(Generic[AgentDeps, ResultData]):
                                 yield result.StreamedRunResult(
                                     messages,
                                     new_message_index,
-
+                                    usage,
+                                    usage_limits,
                                     result_stream,
                                     self._result_schema,
-
+                                    run_context,
                                     self._result_validators,
                                     result_tool_name,
                                     on_complete,
@@ -455,8 +470,10 @@ class Agent(Generic[AgentDeps, ResultData]):
                             handle_span.set_attribute('tool_responses', tool_responses)
                             tool_responses_str = ' '.join(r.part_kind for r in tool_responses)
                             handle_span.message = f'handle model response -> {tool_responses_str}'
-                            # the model_response should have been fully streamed by now, we can add
-
+                            # the model_response should have been fully streamed by now, we can add its usage
+                            model_response_usage = model_response.usage()
+                            usage += model_response_usage
+                            usage_limits.check_tokens(usage)
 
     @contextmanager
     def override(
@@ -798,41 +815,39 @@ class Agent(Generic[AgentDeps, ResultData]):
 
         return model_, mode_selection
 
-    async def _prepare_model(
-
-    ) -> models.AgentModel:
-        """Create building tools and create an agent model."""
+    async def _prepare_model(self, run_context: RunContext[AgentDeps]) -> models.AgentModel:
+        """Build tools and create an agent model."""
         function_tools: list[ToolDefinition] = []
 
         async def add_tool(tool: Tool[AgentDeps]) -> None:
-            ctx =
+            ctx = run_context.replace_with(retry=tool.current_retry, tool_name=tool.name)
             if tool_def := await tool.prepare_tool_def(ctx):
                 function_tools.append(tool_def)
 
         await asyncio.gather(*map(add_tool, self._function_tools.values()))
 
-        return await model.agent_model(
+        return await run_context.model.agent_model(
             function_tools=function_tools,
             allow_text_result=self._allow_text_result,
             result_tools=self._result_schema.tool_defs() if self._result_schema is not None else [],
         )
 
     async def _prepare_messages(
-        self,
+        self, user_prompt: str, message_history: list[_messages.ModelMessage] | None, run_context: RunContext[AgentDeps]
     ) -> list[_messages.ModelMessage]:
         if message_history:
             # shallow copy messages
             messages = message_history.copy()
             messages.append(_messages.ModelRequest([_messages.UserPromptPart(user_prompt)]))
         else:
-            parts = await self._sys_parts(
+            parts = await self._sys_parts(run_context)
             parts.append(_messages.UserPromptPart(user_prompt))
             messages: list[_messages.ModelMessage] = [_messages.ModelRequest(parts)]
 
         return messages
 
     async def _handle_model_response(
-        self, model_response: _messages.ModelResponse,
+        self, model_response: _messages.ModelResponse, run_context: RunContext[AgentDeps]
     ) -> tuple[_MarkFinalResult[ResultData] | None, list[_messages.ModelRequestPart]]:
         """Process a non-streamed response from the model.
@@ -841,42 +856,44 @@ class Agent(Generic[AgentDeps, ResultData]):
         """
         texts: list[str] = []
         tool_calls: list[_messages.ToolCallPart] = []
-        for
-        if isinstance(
-
+        for part in model_response.parts:
+            if isinstance(part, _messages.TextPart):
+                # ignore empty content for text parts, see #437
+                if part.content:
+                    texts.append(part.content)
             else:
-                tool_calls.append(
+                tool_calls.append(part)
 
         if texts:
             text = '\n\n'.join(texts)
-            return await self._handle_text_response(text,
+            return await self._handle_text_response(text, run_context)
         elif tool_calls:
-            return await self._handle_structured_response(tool_calls,
+            return await self._handle_structured_response(tool_calls, run_context)
         else:
            raise exceptions.UnexpectedModelBehavior('Received empty model response')
 
     async def _handle_text_response(
-        self, text: str,
+        self, text: str, run_context: RunContext[AgentDeps]
     ) -> tuple[_MarkFinalResult[ResultData] | None, list[_messages.ModelRequestPart]]:
         """Handle a plain text response from the model for non-streaming responses."""
         if self._allow_text_result:
             result_data_input = cast(ResultData, text)
             try:
-                result_data = await self._validate_result(result_data_input,
+                result_data = await self._validate_result(result_data_input, run_context, None)
             except _result.ToolRetryError as e:
-                self._incr_result_retry()
+                self._incr_result_retry(run_context)
                 return None, [e.tool_retry]
             else:
                 return _MarkFinalResult(result_data, None), []
         else:
-            self._incr_result_retry()
+            self._incr_result_retry(run_context)
            response = _messages.RetryPromptPart(
                content='Plain text responses are not permitted, please call one of the functions instead.',
            )
            return None, [response]
 
     async def _handle_structured_response(
-        self, tool_calls: list[_messages.ToolCallPart],
+        self, tool_calls: list[_messages.ToolCallPart], run_context: RunContext[AgentDeps]
     ) -> tuple[_MarkFinalResult[ResultData] | None, list[_messages.ModelRequestPart]]:
         """Handle a structured response containing tool calls from the model for non-streaming responses."""
         assert tool_calls, 'Expected at least one tool call'
@@ -890,17 +907,15 @@ class Agent(Generic[AgentDeps, ResultData]):
                 call, result_tool = match
                 try:
                     result_data = result_tool.validate(call)
-                    result_data = await self._validate_result(result_data,
+                    result_data = await self._validate_result(result_data, run_context, call)
                 except _result.ToolRetryError as e:
-                    self._incr_result_retry()
+                    self._incr_result_retry(run_context)
                     parts.append(e.tool_retry)
                 else:
                     final_result = _MarkFinalResult(result_data, call.tool_name)
 
         # Then build the other request parts based on end strategy
-        parts += await self._process_function_tools(
-            tool_calls, final_result and final_result.tool_name, deps, conv_messages
-        )
+        parts += await self._process_function_tools(tool_calls, final_result and final_result.tool_name, run_context)
 
         return final_result, parts
@@ -908,8 +923,7 @@ class Agent(Generic[AgentDeps, ResultData]):
         self,
         tool_calls: list[_messages.ToolCallPart],
         result_tool_name: str | None,
-        deps: AgentDeps,
-        conv_messages: list[_messages.ModelMessage],
+        run_context: RunContext[AgentDeps],
     ) -> list[_messages.ModelRequestPart]:
         """Process function (non-result) tool calls in parallel.
@@ -942,7 +956,7 @@ class Agent(Generic[AgentDeps, ResultData]):
                         )
                     )
                 else:
-                    tasks.append(asyncio.create_task(tool.run(
+                    tasks.append(asyncio.create_task(tool.run(call, run_context), name=call.tool_name))
             elif self._result_schema is not None and call.tool_name in self._result_schema.tools:
                 # if tool_name is in _result_schema, it means we found a result tool but an error occurred in
                 # validation, we don't add another part here
@@ -955,7 +969,7 @@ class Agent(Generic[AgentDeps, ResultData]):
                     )
                 )
             else:
-                parts.append(self._unknown_tool(call.tool_name))
+                parts.append(self._unknown_tool(call.tool_name, run_context))
 
         # Run all tool tasks in parallel
         if tasks:
@@ -967,8 +981,7 @@ class Agent(Generic[AgentDeps, ResultData]):
     async def _handle_streamed_model_response(
         self,
         model_response: models.EitherStreamedResponse,
-        deps: AgentDeps,
-        conv_messages: list[_messages.ModelMessage],
+        run_context: RunContext[AgentDeps],
     ) -> (
         _MarkFinalResult[models.EitherStreamedResponse]
         | tuple[_messages.ModelResponse, list[_messages.ModelRequestPart]]
@@ -984,11 +997,11 @@ class Agent(Generic[AgentDeps, ResultData]):
             if self._allow_text_result:
                 return _MarkFinalResult(model_response, None)
             else:
-                self._incr_result_retry()
+                self._incr_result_retry(run_context)
                 response = _messages.RetryPromptPart(
                     content='Plain text responses are not permitted, please call one of the functions instead.',
                 )
-                # stream the response, so
+                # stream the response, so usage is correct
                 async for _ in model_response:
                     pass
@@ -1024,9 +1037,9 @@ class Agent(Generic[AgentDeps, ResultData]):
             if isinstance(item, _messages.ToolCallPart):
                 call = item
                 if tool := self._function_tools.get(call.tool_name):
-                    tasks.append(asyncio.create_task(tool.run(
+                    tasks.append(asyncio.create_task(tool.run(call, run_context), name=call.tool_name))
                 else:
-                    parts.append(self._unknown_tool(call.tool_name))
+                    parts.append(self._unknown_tool(call.tool_name, run_context))
 
         with _logfire.span('running {tools=}', tools=[t.get_name() for t in tasks]):
             task_results: Sequence[_messages.ModelRequestPart] = await asyncio.gather(*tasks)
@@ -1038,33 +1051,30 @@ class Agent(Generic[AgentDeps, ResultData]):
     async def _validate_result(
         self,
         result_data: ResultData,
-        deps: AgentDeps,
+        run_context: RunContext[AgentDeps],
         tool_call: _messages.ToolCallPart | None,
-        conv_messages: list[_messages.ModelMessage],
     ) -> ResultData:
         for validator in self._result_validators:
-            result_data = await validator.validate(
-                result_data, deps, self._current_result_retry, tool_call, conv_messages
-            )
+            result_data = await validator.validate(result_data, tool_call, run_context)
         return result_data
 
-    def _incr_result_retry(self) -> None:
-        self._current_result_retry += 1
-        if self._current_result_retry > self._max_result_retries:
+    def _incr_result_retry(self, run_context: RunContext[AgentDeps]) -> None:
+        run_context.retry += 1
+        if run_context.retry > self._max_result_retries:
             raise exceptions.UnexpectedModelBehavior(
                 f'Exceeded maximum retries ({self._max_result_retries}) for result validation'
             )
 
-    async def _sys_parts(self,
+    async def _sys_parts(self, run_context: RunContext[AgentDeps]) -> list[_messages.ModelRequestPart]:
         """Build the initial messages for the conversation."""
         messages: list[_messages.ModelRequestPart] = [_messages.SystemPromptPart(p) for p in self._system_prompts]
         for sys_prompt_runner in self._system_prompt_functions:
-            prompt = await sys_prompt_runner.run(
+            prompt = await sys_prompt_runner.run(run_context)
             messages.append(_messages.SystemPromptPart(prompt))
         return messages
 
-    def _unknown_tool(self, tool_name: str) -> _messages.RetryPromptPart:
-        self._incr_result_retry()
+    def _unknown_tool(self, tool_name: str, run_context: RunContext[AgentDeps]) -> _messages.RetryPromptPart:
+        self._incr_result_retry(run_context)
         names = list(self._function_tools.keys())
         if self._result_schema:
             names.extend(self._result_schema.tool_names())
pydantic_ai/exceptions.py
CHANGED
@@ -2,7 +2,7 @@ from __future__ import annotations as _annotations
 
 import json
 
-__all__ = 'ModelRetry', 'UserError', 'UnexpectedModelBehavior'
+__all__ = 'ModelRetry', 'UserError', 'AgentRunError', 'UnexpectedModelBehavior', 'UsageLimitExceeded'
 
 
 class ModelRetry(Exception):
@@ -30,7 +30,25 @@ class UserError(RuntimeError):
         super().__init__(message)
 
 
-class UnexpectedModelBehavior(RuntimeError):
+class AgentRunError(RuntimeError):
+    """Base class for errors occurring during an agent run."""
+
+    message: str
+    """The error message."""
+
+    def __init__(self, message: str):
+        self.message = message
+        super().__init__(message)
+
+    def __str__(self) -> str:
+        return self.message
+
+
+class UsageLimitExceeded(AgentRunError):
+    """Error raised when a Model's usage exceeds the specified limits."""
+
+
+class UnexpectedModelBehavior(AgentRunError):
     """Error caused by unexpected Model behavior, e.g. an unexpected response code."""
 
     message: str
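With `AgentRunError` as the shared base class, callers can catch every run-time agent failure in one place or distinguish usage-limit aborts from model misbehaviour. A brief sketch (the helper function is illustrative):

    from pydantic_ai.exceptions import AgentRunError, UnexpectedModelBehavior, UsageLimitExceeded

    def describe(exc: AgentRunError) -> str:
        # both subclasses inherit the .message attribute from the base class
        if isinstance(exc, UsageLimitExceeded):
            return f'usage limit hit: {exc.message}'
        if isinstance(exc, UnexpectedModelBehavior):
            return f'model misbehaved: {exc.message}'
        return exc.message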
pydantic_ai/messages.py
CHANGED
@@ -2,11 +2,11 @@ from __future__ import annotations as _annotations
 
 from dataclasses import dataclass, field
 from datetime import datetime
-from typing import Annotated, Any, Literal, Union
+from typing import Annotated, Any, Literal, Union, cast
 
 import pydantic
 import pydantic_core
-from typing_extensions import Self
+from typing_extensions import Self, assert_never
 
 from ._utils import now_utc as _now_utc
 
@@ -190,12 +190,34 @@ class ToolCallPart:
     """Part type identifier, this is available on all parts as a discriminator."""
 
     @classmethod
-    def
-
+    def from_raw_args(cls, tool_name: str, args: str | dict[str, Any], tool_call_id: str | None = None) -> Self:
+        """Create a `ToolCallPart` from raw arguments."""
+        if isinstance(args, str):
+            return cls(tool_name, ArgsJson(args), tool_call_id)
+        elif isinstance(args, dict):
+            return cls(tool_name, ArgsDict(args), tool_call_id)
+        else:
+            assert_never(args)
 
-
-
-
+    def args_as_dict(self) -> dict[str, Any]:
+        """Return the arguments as a Python dictionary.
+
+        This is just for convenience with models that require dicts as input.
+        """
+        if isinstance(self.args, ArgsDict):
+            return self.args.args_dict
+        args = pydantic_core.from_json(self.args.args_json)
+        assert isinstance(args, dict), 'args should be a dict'
+        return cast(dict[str, Any], args)
+
+    def args_as_json_str(self) -> str:
+        """Return the arguments as a JSON string.
+
+        This is just for convenience with models that require JSON strings as input.
+        """
+        if isinstance(self.args, ArgsJson):
+            return self.args.args_json
+        return pydantic_core.to_json(self.args.args_dict).decode()
 
     def has_content(self) -> bool:
         if isinstance(self.args, ArgsDict):
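These helpers normalise tool-call arguments between the JSON-string form used by OpenAI-style APIs and the dict form used by e.g. Gemini, which presumably explains the reduced line counts in the model adapter diffs listed above. A quick sketch of the new surface:

    from pydantic_ai.messages import ToolCallPart

    # from_raw_args picks ArgsJson or ArgsDict based on the input type
    call_a = ToolCallPart.from_raw_args('get_weather', '{"city": "Paris"}')
    call_b = ToolCallPart.from_raw_args('get_weather', {'city': 'Paris'})

    # either representation can be read back in whichever form a model needs
    assert call_a.args_as_dict() == {'city': 'Paris'}
    assert call_b.args_as_json_str() == '{"city":"Paris"}'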
|