pydantic-ai-slim 0.8.0__py3-none-any.whl → 1.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of pydantic-ai-slim might be problematic.

Files changed (75)
  1. pydantic_ai/__init__.py +28 -2
  2. pydantic_ai/_a2a.py +1 -1
  3. pydantic_ai/_agent_graph.py +323 -156
  4. pydantic_ai/_function_schema.py +5 -5
  5. pydantic_ai/_griffe.py +2 -1
  6. pydantic_ai/_otel_messages.py +2 -2
  7. pydantic_ai/_output.py +31 -35
  8. pydantic_ai/_parts_manager.py +7 -5
  9. pydantic_ai/_run_context.py +3 -1
  10. pydantic_ai/_system_prompt.py +2 -2
  11. pydantic_ai/_tool_manager.py +32 -28
  12. pydantic_ai/_utils.py +14 -26
  13. pydantic_ai/ag_ui.py +82 -51
  14. pydantic_ai/agent/__init__.py +84 -17
  15. pydantic_ai/agent/abstract.py +35 -4
  16. pydantic_ai/agent/wrapper.py +6 -0
  17. pydantic_ai/builtin_tools.py +2 -2
  18. pydantic_ai/common_tools/duckduckgo.py +4 -2
  19. pydantic_ai/durable_exec/temporal/__init__.py +70 -17
  20. pydantic_ai/durable_exec/temporal/_agent.py +93 -11
  21. pydantic_ai/durable_exec/temporal/_function_toolset.py +53 -6
  22. pydantic_ai/durable_exec/temporal/_logfire.py +6 -3
  23. pydantic_ai/durable_exec/temporal/_mcp_server.py +2 -1
  24. pydantic_ai/durable_exec/temporal/_model.py +2 -2
  25. pydantic_ai/durable_exec/temporal/_run_context.py +2 -1
  26. pydantic_ai/durable_exec/temporal/_toolset.py +2 -1
  27. pydantic_ai/exceptions.py +45 -2
  28. pydantic_ai/format_prompt.py +2 -2
  29. pydantic_ai/mcp.py +15 -27
  30. pydantic_ai/messages.py +156 -44
  31. pydantic_ai/models/__init__.py +20 -7
  32. pydantic_ai/models/anthropic.py +10 -17
  33. pydantic_ai/models/bedrock.py +55 -57
  34. pydantic_ai/models/cohere.py +3 -3
  35. pydantic_ai/models/fallback.py +2 -2
  36. pydantic_ai/models/function.py +25 -23
  37. pydantic_ai/models/gemini.py +13 -14
  38. pydantic_ai/models/google.py +19 -5
  39. pydantic_ai/models/groq.py +127 -39
  40. pydantic_ai/models/huggingface.py +5 -5
  41. pydantic_ai/models/instrumented.py +49 -21
  42. pydantic_ai/models/mcp_sampling.py +3 -1
  43. pydantic_ai/models/mistral.py +8 -8
  44. pydantic_ai/models/openai.py +37 -42
  45. pydantic_ai/models/test.py +24 -4
  46. pydantic_ai/output.py +27 -32
  47. pydantic_ai/profiles/__init__.py +3 -3
  48. pydantic_ai/profiles/groq.py +1 -1
  49. pydantic_ai/profiles/openai.py +25 -4
  50. pydantic_ai/providers/__init__.py +4 -0
  51. pydantic_ai/providers/anthropic.py +2 -3
  52. pydantic_ai/providers/bedrock.py +3 -2
  53. pydantic_ai/providers/google_vertex.py +2 -1
  54. pydantic_ai/providers/groq.py +21 -2
  55. pydantic_ai/providers/litellm.py +134 -0
  56. pydantic_ai/result.py +173 -52
  57. pydantic_ai/retries.py +52 -31
  58. pydantic_ai/run.py +12 -5
  59. pydantic_ai/tools.py +127 -23
  60. pydantic_ai/toolsets/__init__.py +4 -1
  61. pydantic_ai/toolsets/_dynamic.py +4 -4
  62. pydantic_ai/toolsets/abstract.py +18 -2
  63. pydantic_ai/toolsets/approval_required.py +32 -0
  64. pydantic_ai/toolsets/combined.py +7 -12
  65. pydantic_ai/toolsets/{deferred.py → external.py} +11 -5
  66. pydantic_ai/toolsets/filtered.py +1 -1
  67. pydantic_ai/toolsets/function.py +58 -21
  68. pydantic_ai/toolsets/wrapper.py +2 -1
  69. pydantic_ai/usage.py +44 -8
  70. {pydantic_ai_slim-0.8.0.dist-info → pydantic_ai_slim-1.0.0.dist-info}/METADATA +8 -9
  71. pydantic_ai_slim-1.0.0.dist-info/RECORD +121 -0
  72. pydantic_ai_slim-0.8.0.dist-info/RECORD +0 -119
  73. {pydantic_ai_slim-0.8.0.dist-info → pydantic_ai_slim-1.0.0.dist-info}/WHEEL +0 -0
  74. {pydantic_ai_slim-0.8.0.dist-info → pydantic_ai_slim-1.0.0.dist-info}/entry_points.txt +0 -0
  75. {pydantic_ai_slim-0.8.0.dist-info → pydantic_ai_slim-1.0.0.dist-info}/licenses/LICENSE +0 -0
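The most consequential API change visible in this list is the rework of deferred tools: `toolsets/deferred.py` becomes `toolsets/external.py`, `toolsets/approval_required.py` is new, and `pydantic_ai/tools.py` gains `DeferredToolResult`, `ToolApproved`, and `ToolDenied`, while the old `DeferredToolCalls` output type is replaced by `DeferredToolRequests` (see the `_agent_graph.py` diff below). A rough sketch of the new flow, inferred only from names in this diff — the import locations, the model string, and the mechanism for resuming a run with the collected results are assumptions, not confirmed here:

    # Hypothetical usage of the 1.0.0 deferred-tool types; only the type names
    # and the calls/approvals split are confirmed by the diff below.
    from pydantic_ai import Agent
    from pydantic_ai.output import DeferredToolRequests  # import location assumed
    from pydantic_ai.tools import ToolApproved, ToolDenied

    agent = Agent('openai:gpt-5', output_type=[str, DeferredToolRequests])

    result = agent.run_sync('Clean up the old backups')
    if isinstance(result.output, DeferredToolRequests):
        # `approvals` holds ToolCallPart objects awaiting a human decision;
        # build a mapping of tool_call_id -> DeferredToolResult to resume the run.
        results = {
            call.tool_call_id: ToolApproved() if call.tool_name == 'list_backups' else ToolDenied(message='Not allowed.')
            for call in result.output.approvals
        }
        # Resuming the run with these results goes through the agent API
        # (changed in pydantic_ai/agent/__init__.py, not shown in this diff).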
pydantic_ai/_agent_graph.py
@@ -2,16 +2,15 @@ from __future__ import annotations as _annotations
 
 import asyncio
 import dataclasses
-import hashlib
 from collections import defaultdict, deque
-from collections.abc import AsyncIterator, Awaitable, Iterator, Sequence
+from collections.abc import AsyncIterator, Awaitable, Callable, Iterator, Sequence
 from contextlib import asynccontextmanager, contextmanager
 from contextvars import ContextVar
 from dataclasses import field
-from typing import TYPE_CHECKING, Any, Callable, Generic, Literal, Union, cast
+from typing import TYPE_CHECKING, Any, Generic, Literal, TypeGuard, cast
 
 from opentelemetry.trace import Tracer
-from typing_extensions import TypeGuard, TypeVar, assert_never
+from typing_extensions import TypeVar, assert_never
 
 from pydantic_ai._function_schema import _takes_ctx as is_takes_ctx  # type: ignore
 from pydantic_ai._tool_manager import ToolManager
@@ -24,7 +23,14 @@ from . import _output, _system_prompt, exceptions, messages as _messages, models
 from .exceptions import ToolRetryError
 from .output import OutputDataT, OutputSpec
 from .settings import ModelSettings
-from .tools import RunContext, ToolDefinition, ToolKind
+from .tools import (
+    DeferredToolResult,
+    RunContext,
+    ToolApproved,
+    ToolDefinition,
+    ToolDenied,
+    ToolKind,
+)
 
 if TYPE_CHECKING:
     from .models.instrumented import InstrumentationSettings
@@ -59,19 +65,19 @@ _HistoryProcessorSyncWithCtx = Callable[[RunContext[DepsT], list[_messages.Model
 _HistoryProcessorAsyncWithCtx = Callable[
     [RunContext[DepsT], list[_messages.ModelMessage]], Awaitable[list[_messages.ModelMessage]]
 ]
-HistoryProcessor = Union[
-    _HistoryProcessorSync,
-    _HistoryProcessorAsync,
-    _HistoryProcessorSyncWithCtx[DepsT],
-    _HistoryProcessorAsyncWithCtx[DepsT],
-]
+HistoryProcessor = (
+    _HistoryProcessorSync
+    | _HistoryProcessorAsync
+    | _HistoryProcessorSyncWithCtx[DepsT]
+    | _HistoryProcessorAsyncWithCtx[DepsT]
+)
 """A function that processes a list of model messages and returns a list of model messages.
 
 Can optionally accept a `RunContext` as a parameter.
 """
 
 
-@dataclasses.dataclass
+@dataclasses.dataclass(kw_only=True)
 class GraphAgentState:
     """State kept across the execution of the agent graph."""
 
@@ -92,7 +98,7 @@ class GraphAgentState:
         raise exceptions.UnexpectedModelBehavior(message)
 
 
-@dataclasses.dataclass
+@dataclasses.dataclass(kw_only=True)
 class GraphAgentDeps(Generic[DepsT, OutputDataT]):
     """Dependencies/config passed to the agent graph."""
 
@@ -115,9 +121,10 @@ class GraphAgentDeps(Generic[DepsT, OutputDataT]):
 
     builtin_tools: list[AbstractBuiltinTool] = dataclasses.field(repr=False)
     tool_manager: ToolManager[DepsT]
+    tool_call_results: dict[str, DeferredToolResult] | None
 
     tracer: Tracer
-    instrumentation_settings: InstrumentationSettings | None = None
+    instrumentation_settings: InstrumentationSettings | None
 
 
 class AgentNode(BaseNode[GraphAgentState, GraphAgentDeps[DepsT, Any], result.FinalResult[NodeRunEndT]]):
@@ -149,6 +156,8 @@ class UserPromptNode(AgentNode[DepsT, NodeRunEndT]):
 
     user_prompt: str | Sequence[_messages.UserContent] | None
 
+    _: dataclasses.KW_ONLY
+
    instructions: str | None
    instructions_functions: list[_system_prompt.SystemPromptRunner[DepsT]]
 
@@ -158,7 +167,7 @@ class UserPromptNode(AgentNode[DepsT, NodeRunEndT]):
 
     async def run(
         self, ctx: GraphRunContext[GraphAgentState, GraphAgentDeps[DepsT, NodeRunEndT]]
-    ) -> Union[ModelRequestNode[DepsT, NodeRunEndT], CallToolsNode[DepsT, NodeRunEndT]]:  # noqa UP007
+    ) -> ModelRequestNode[DepsT, NodeRunEndT] | CallToolsNode[DepsT, NodeRunEndT]:
         try:
             ctx_messages = get_captured_run_messages()
         except LookupError:
@@ -184,26 +193,29 @@ class UserPromptNode(AgentNode[DepsT, NodeRunEndT]):
         else:
             parts.extend(await self._sys_parts(run_context))
 
+        if (tool_call_results := ctx.deps.tool_call_results) is not None:
+            if messages and (last_message := messages[-1]) and isinstance(last_message, _messages.ModelRequest):
+                # If tool call results were provided, that means the previous run ended on deferred tool calls.
+                # That run would typically have ended on a `ModelResponse`, but if it had a mix of deferred tool calls and ones that could already be executed,
+                # a `ModelRequest` would already have been added to the history with the preliminary results, even if it wouldn't have been sent to the model yet.
+                # So now that we have all of the deferred results, we roll back to the last `ModelResponse` and store the contents of the `ModelRequest` on `deferred_tool_results` to be handled by `CallToolsNode`.
+                ctx.deps.tool_call_results = self._update_tool_call_results_from_model_request(
+                    tool_call_results, last_message
+                )
+                messages.pop()
+
+            if not messages:
+                raise exceptions.UserError('Tool call results were provided, but the message history is empty.')
+
         if messages and (last_message := messages[-1]):
             if isinstance(last_message, _messages.ModelRequest) and self.user_prompt is None:
                 # Drop last message from history and reuse its parts
                 messages.pop()
                 parts.extend(last_message.parts)
             elif isinstance(last_message, _messages.ModelResponse):
-                if self.user_prompt is None:
-                    # `CallToolsNode` requires the tool manager to be prepared for the run step
-                    # This will raise errors for any tool name conflicts
-                    ctx.deps.tool_manager = await ctx.deps.tool_manager.for_run_step(run_context)
-
-                    # Skip ModelRequestNode and go directly to CallToolsNode
-                    return CallToolsNode[DepsT, NodeRunEndT](model_response=last_message)
-                elif any(isinstance(part, _messages.ToolCallPart) for part in last_message.parts):
-                    raise exceptions.UserError(
-                        'Cannot provide a new user prompt when the message history ends with '
-                        'a model response containing unprocessed tool calls. Either process the '
-                        'tool calls first (by calling `iter` with `user_prompt=None`) or append a '
-                        '`ModelRequest` with `ToolResultPart`s.'
-                    )
+                call_tools_node = await self._handle_message_history_model_response(ctx, last_message)
+                if call_tools_node is not None:
+                    return call_tools_node
 
         if self.user_prompt is not None:
             parts.append(_messages.UserPromptPart(self.user_prompt))
@@ -213,6 +225,74 @@ class UserPromptNode(AgentNode[DepsT, NodeRunEndT]):
 
         return ModelRequestNode[DepsT, NodeRunEndT](request=next_message)
 
+    async def _handle_message_history_model_response(
+        self,
+        ctx: GraphRunContext[GraphAgentState, GraphAgentDeps[DepsT, NodeRunEndT]],
+        message: _messages.ModelResponse,
+    ) -> CallToolsNode[DepsT, NodeRunEndT] | None:
+        unprocessed_tool_calls = any(isinstance(part, _messages.ToolCallPart) for part in message.parts)
+        if unprocessed_tool_calls:
+            if self.user_prompt is not None:
+                raise exceptions.UserError(
+                    'Cannot provide a new user prompt when the message history contains unprocessed tool calls.'
+                )
+        else:
+            if ctx.deps.tool_call_results is not None:
+                raise exceptions.UserError(
+                    'Tool call results were provided, but the message history does not contain any unprocessed tool calls.'
+                )
+
+        if unprocessed_tool_calls or self.user_prompt is None:
+            # `CallToolsNode` requires the tool manager to be prepared for the run step
+            # This will raise errors for any tool name conflicts
+            run_context = build_run_context(ctx)
+            ctx.deps.tool_manager = await ctx.deps.tool_manager.for_run_step(run_context)
+
+            # Skip ModelRequestNode and go directly to CallToolsNode
+            return CallToolsNode[DepsT, NodeRunEndT](model_response=message)
+
+    def _update_tool_call_results_from_model_request(
+        self, tool_call_results: dict[str, DeferredToolResult], message: _messages.ModelRequest
+    ) -> dict[str, DeferredToolResult]:
+        last_tool_return: _messages.ToolReturn | None = None
+        user_content: list[str | _messages.UserContent] = []
+        for part in message.parts:
+            if isinstance(part, _messages.ToolReturnPart):
+                if part.tool_call_id in tool_call_results:
+                    raise exceptions.UserError(
+                        f'Tool call {part.tool_call_id!r} was already executed and its result cannot be overridden.'
+                    )
+
+                last_tool_return = _messages.ToolReturn(return_value=part.content, metadata=part.metadata)
+                tool_call_results[part.tool_call_id] = last_tool_return
+            elif isinstance(part, _messages.RetryPromptPart):
+                if part.tool_call_id in tool_call_results:
+                    raise exceptions.UserError(
+                        f'Tool call {part.tool_call_id!r} was already executed and its result cannot be overridden.'
+                    )
+
+                tool_call_results[part.tool_call_id] = part
+            elif isinstance(part, _messages.UserPromptPart):
+                # Tools can return user parts via `ToolReturn.content` or by returning multi-modal content.
+                # These go together with a specific `ToolReturnPart`, but we don't have a way to know which,
+                # so (below) we just add them to the last one, matching the tool-results-before-user-parts order of the request.
+                if isinstance(part.content, str):
+                    user_content.append(part.content)
+                else:
+                    user_content.extend(part.content)
+            else:
+                raise exceptions.UserError(f'Unexpected message part type: {type(part)}')  # pragma: no cover
+
+        if user_content:
+            if last_tool_return is None:
+                raise exceptions.UserError(
+                    'Tool call results were provided, but the last message in the history was a `ModelRequest` with user parts not tied to preliminary tool results.'
+                )
+            assert last_tool_return is not None
+            last_tool_return.content = user_content
+
+        return tool_call_results
+
     async def _reevaluate_dynamic_prompts(
         self, messages: list[_messages.ModelMessage], run_context: RunContext[DepsT]
     ) -> None:
@@ -221,16 +301,21 @@ class UserPromptNode(AgentNode[DepsT, NodeRunEndT]):
         if self.system_prompt_dynamic_functions:
             for msg in messages:
                 if isinstance(msg, _messages.ModelRequest):
-                    for i, part in enumerate(msg.parts):
+                    reevaluated_message_parts: list[_messages.ModelRequestPart] = []
+                    for part in msg.parts:
                         if isinstance(part, _messages.SystemPromptPart) and part.dynamic_ref:
                             # Look up the runner by its ref
                             if runner := self.system_prompt_dynamic_functions.get(  # pragma: lax no cover
                                 part.dynamic_ref
                             ):
                                 updated_part_content = await runner.run(run_context)
-                                msg.parts[i] = _messages.SystemPromptPart(
-                                    updated_part_content, dynamic_ref=part.dynamic_ref
-                                )
+                                part = _messages.SystemPromptPart(updated_part_content, dynamic_ref=part.dynamic_ref)
+
+                        reevaluated_message_parts.append(part)
+
+                    # Replace message parts with reevaluated ones to prevent mutating parts list
+                    if reevaluated_message_parts != msg.parts:
+                        msg.parts = reevaluated_message_parts
 
     async def _sys_parts(self, run_context: RunContext[DepsT]) -> list[_messages.ModelRequestPart]:
         """Build the initial messages for the conversation."""
@@ -280,8 +365,8 @@ class ModelRequestNode(AgentNode[DepsT, NodeRunEndT]):
 
     request: _messages.ModelRequest
 
-    _result: CallToolsNode[DepsT, NodeRunEndT] | None = field(default=None, repr=False)
-    _did_stream: bool = field(default=False, repr=False)
+    _result: CallToolsNode[DepsT, NodeRunEndT] | None = field(repr=False, init=False, default=None)
+    _did_stream: bool = field(repr=False, init=False, default=False)
 
     async def run(
         self, ctx: GraphRunContext[GraphAgentState, GraphAgentDeps[DepsT, NodeRunEndT]]
@@ -310,13 +395,13 @@ class ModelRequestNode(AgentNode[DepsT, NodeRunEndT]):
             self._did_stream = True
             ctx.state.usage.requests += 1
             agent_stream = result.AgentStream[DepsT, T](
-                streamed_response,
-                ctx.deps.output_schema,
-                model_request_parameters,
-                ctx.deps.output_validators,
-                build_run_context(ctx),
-                ctx.deps.usage_limits,
-                ctx.deps.tool_manager,
+                _raw_stream_response=streamed_response,
+                _output_schema=ctx.deps.output_schema,
+                _model_request_parameters=model_request_parameters,
+                _output_validators=ctx.deps.output_validators,
+                _run_ctx=build_run_context(ctx),
+                _usage_limits=ctx.deps.usage_limits,
+                _tool_manager=ctx.deps.tool_manager,
             )
             yield agent_stream
             # In case the user didn't manually consume the full stream, ensure it is fully consumed here,
@@ -396,14 +481,14 @@ class CallToolsNode(AgentNode[DepsT, NodeRunEndT]):
 
     model_response: _messages.ModelResponse
 
-    _events_iterator: AsyncIterator[_messages.HandleResponseEvent] | None = field(default=None, repr=False)
+    _events_iterator: AsyncIterator[_messages.HandleResponseEvent] | None = field(default=None, init=False, repr=False)
     _next_node: ModelRequestNode[DepsT, NodeRunEndT] | End[result.FinalResult[NodeRunEndT]] | None = field(
-        default=None, repr=False
+        default=None, init=False, repr=False
     )
 
     async def run(
         self, ctx: GraphRunContext[GraphAgentState, GraphAgentDeps[DepsT, NodeRunEndT]]
-    ) -> Union[ModelRequestNode[DepsT, NodeRunEndT], End[result.FinalResult[NodeRunEndT]]]:  # noqa UP007
+    ) -> ModelRequestNode[DepsT, NodeRunEndT] | End[result.FinalResult[NodeRunEndT]]:
         async with self.stream(ctx):
             pass
         assert self._next_node is not None, 'the stream should set `self._next_node` before it ends'
@@ -506,13 +591,6 @@ class CallToolsNode(AgentNode[DepsT, NodeRunEndT]):
         if output_final_result:
             final_result = output_final_result[0]
             self._next_node = self._handle_final_result(ctx, final_result, output_parts)
-        elif deferred_tool_calls := ctx.deps.tool_manager.get_deferred_tool_calls(tool_calls):
-            if not ctx.deps.output_schema.allows_deferred_tool_calls:
-                raise exceptions.UserError(
-                    'A deferred tool call was present, but `DeferredToolCalls` is not among output types. To resolve this, add `DeferredToolCalls` to the list of output types for this agent.'
-                )
-            final_result = result.FinalResult(cast(NodeRunEndT, deferred_tool_calls), None, None)
-            self._next_node = self._handle_final_result(ctx, final_result, output_parts)
         else:
             instructions = await ctx.deps.get_instructions(run_context)
             self._next_node = ModelRequestNode[DepsT, NodeRunEndT](
@@ -557,7 +635,7 @@ class CallToolsNode(AgentNode[DepsT, NodeRunEndT]):
             ctx.state.increment_retries(ctx.deps.max_result_retries, e)
             return ModelRequestNode[DepsT, NodeRunEndT](_messages.ModelRequest(parts=[e.tool_retry]))
         else:
-            return self._handle_final_result(ctx, result.FinalResult(result_data, None, None), [])
+            return self._handle_final_result(ctx, result.FinalResult(result_data), [])
 
 
 def build_run_context(ctx: GraphRunContext[GraphAgentState, GraphAgentDeps[DepsT, Any]]) -> RunContext[DepsT]:
@@ -572,16 +650,10 @@ def build_run_context(ctx: GraphRunContext[GraphAgentState, GraphAgentDeps[DepsT
         trace_include_content=ctx.deps.instrumentation_settings is not None
         and ctx.deps.instrumentation_settings.include_content,
         run_step=ctx.state.run_step,
+        tool_call_approved=ctx.state.run_step == 0 and ctx.deps.tool_call_results is not None,
     )
 
 
-def multi_modal_content_identifier(identifier: str | bytes) -> str:
-    """Generate stable identifier for multi-modal content to help LLM in finding a specific file in tool call responses."""
-    if isinstance(identifier, str):
-        identifier = identifier.encode('utf-8')
-    return hashlib.sha1(identifier).hexdigest()[:6]
-
-
 async def process_function_tools(  # noqa: C901
     tool_manager: ToolManager[DepsT],
     tool_calls: list[_messages.ToolCallPart],
@@ -599,7 +671,10 @@ async def process_function_tools(  # noqa: C901
     tool_calls_by_kind: dict[ToolKind | Literal['unknown'], list[_messages.ToolCallPart]] = defaultdict(list)
     for call in tool_calls:
         tool_def = tool_manager.get_tool_def(call.tool_name)
-        kind = tool_def.kind if tool_def else 'unknown'
+        if tool_def:
+            kind = tool_def.kind
+        else:
+            kind = 'unknown'
         tool_calls_by_kind[kind].append(call)
 
     # First, we handle output tool calls
@@ -662,132 +737,224 @@ async def process_function_tools(  # noqa: C901
         ctx.state.increment_retries(ctx.deps.max_result_retries)
         calls_to_run.extend(tool_calls_by_kind['unknown'])
 
-    for call in calls_to_run:
-        yield _messages.FunctionToolCallEvent(call)
+    deferred_tool_results: dict[str, DeferredToolResult] = {}
+    if build_run_context(ctx).tool_call_approved and ctx.deps.tool_call_results is not None:
+        deferred_tool_results = ctx.deps.tool_call_results
 
-    user_parts_by_index: dict[int, list[_messages.UserPromptPart]] = defaultdict(list)
+        # Deferred tool calls are "run" as well, by reading their value from the tool call results
+        calls_to_run.extend(tool_calls_by_kind['external'])
+        calls_to_run.extend(tool_calls_by_kind['unapproved'])
 
-    if calls_to_run:
-        # Run all tool tasks in parallel
-        tool_parts_by_index: dict[int, _messages.ModelRequestPart] = {}
-        with ctx.deps.tracer.start_as_current_span(
-            'running tools',
-            attributes={
-                'tools': [call.tool_name for call in calls_to_run],
-                'logfire.msg': f'running {len(calls_to_run)} tool{"" if len(calls_to_run) == 1 else "s"}',
-            },
-        ):
-            tasks = [
-                asyncio.create_task(_call_function_tool(tool_manager, call), name=call.tool_name)
-                for call in calls_to_run
-            ]
-
-            pending = tasks
-            while pending:
-                done, pending = await asyncio.wait(pending, return_when=asyncio.FIRST_COMPLETED)
-                for task in done:
-                    index = tasks.index(task)
-                    tool_part, tool_user_parts = task.result()
-                    yield _messages.FunctionToolResultEvent(tool_part)
+        result_tool_call_ids = set(deferred_tool_results.keys())
+        tool_call_ids_to_run = {call.tool_call_id for call in calls_to_run}
+        if tool_call_ids_to_run != result_tool_call_ids:
+            raise exceptions.UserError(
+                'Tool call results need to be provided for all deferred tool calls. '
+                f'Expected: {tool_call_ids_to_run}, got: {result_tool_call_ids}'
+            )
 
-                    tool_parts_by_index[index] = tool_part
-                    user_parts_by_index[index] = tool_user_parts
+    deferred_calls: dict[Literal['external', 'unapproved'], list[_messages.ToolCallPart]] = defaultdict(list)
 
-        # We append the results at the end, rather than as they are received, to retain a consistent ordering
-        # This is mostly just to simplify testing
-        for k in sorted(tool_parts_by_index):
-            output_parts.append(tool_parts_by_index[k])
+    if calls_to_run:
+        async for event in _call_tools(
+            tool_manager,
+            calls_to_run,
+            deferred_tool_results,
+            ctx.deps.tracer,
+            ctx.deps.usage_limits,
+            output_parts,
+            deferred_calls,
+        ):
+            yield event
 
-    # Finally, we handle deferred tool calls
-    for call in tool_calls_by_kind['deferred']:
+    # Finally, we handle deferred tool calls (unless they were already included in the run because results were provided)
+    if not deferred_tool_results:
         if final_result:
-            output_parts.append(
-                _messages.ToolReturnPart(
-                    tool_name=call.tool_name,
-                    content='Tool not executed - a final result was already processed.',
-                    tool_call_id=call.tool_call_id,
+            for call in [*tool_calls_by_kind['external'], *tool_calls_by_kind['unapproved']]:
+                output_parts.append(
+                    _messages.ToolReturnPart(
+                        tool_name=call.tool_name,
+                        content='Tool not executed - a final result was already processed.',
+                        tool_call_id=call.tool_call_id,
+                    )
                 )
-            )
         else:
-            yield _messages.FunctionToolCallEvent(call)
+            for call in tool_calls_by_kind['external']:
+                deferred_calls['external'].append(call)
+                yield _messages.FunctionToolCallEvent(call)
 
-    for k in sorted(user_parts_by_index):
-        output_parts.extend(user_parts_by_index[k])
+            for call in tool_calls_by_kind['unapproved']:
+                deferred_calls['unapproved'].append(call)
+                yield _messages.FunctionToolCallEvent(call)
+
+    if not final_result and deferred_calls:
+        if not ctx.deps.output_schema.allows_deferred_tools:
+            raise exceptions.UserError(
+                'A deferred tool call was present, but `DeferredToolRequests` is not among output types. To resolve this, add `DeferredToolRequests` to the list of output types for this agent.'
+            )
+        deferred_tool_requests = _output.DeferredToolRequests(
+            calls=deferred_calls['external'],
+            approvals=deferred_calls['unapproved'],
+        )
+
+        final_result = result.FinalResult(cast(NodeRunEndT, deferred_tool_requests), None, None)
 
     if final_result:
         output_final_result.append(final_result)
 
 
-async def _call_function_tool(
+async def _call_tools(
     tool_manager: ToolManager[DepsT],
-    tool_call: _messages.ToolCallPart,
-) -> tuple[_messages.ToolReturnPart | _messages.RetryPromptPart, list[_messages.UserPromptPart]]:
-    try:
-        tool_result = await tool_manager.handle_call(tool_call)
-    except ToolRetryError as e:
-        return (e.tool_retry, [])
+    tool_calls: list[_messages.ToolCallPart],
+    deferred_tool_results: dict[str, DeferredToolResult],
+    tracer: Tracer,
+    usage_limits: _usage.UsageLimits | None,
+    output_parts: list[_messages.ModelRequestPart],
+    output_deferred_calls: dict[Literal['external', 'unapproved'], list[_messages.ToolCallPart]],
+) -> AsyncIterator[_messages.HandleResponseEvent]:
+    tool_parts_by_index: dict[int, _messages.ModelRequestPart] = {}
+    user_parts_by_index: dict[int, _messages.UserPromptPart] = {}
+    deferred_calls_by_index: dict[int, Literal['external', 'unapproved']] = {}
 
-    tool_part = _messages.ToolReturnPart(
-        tool_name=tool_call.tool_name,
-        content=tool_result,
-        tool_call_id=tool_call.tool_call_id,
-    )
-    user_parts: list[_messages.UserPromptPart] = []
+    for call in tool_calls:
+        yield _messages.FunctionToolCallEvent(call)
 
-    if isinstance(tool_result, _messages.ToolReturn):
-        if (
-            isinstance(tool_result.return_value, _messages.MultiModalContentTypes)
-            or isinstance(tool_result.return_value, list)
-            and any(
-                isinstance(content, _messages.MultiModalContentTypes)
-                for content in tool_result.return_value  # type: ignore
-            )
-        ):
-            raise exceptions.UserError(
-                f'The `return_value` of tool {tool_call.tool_name!r} contains invalid nested `MultiModalContentTypes` objects. '
-                f'Please use `content` instead.'
+    # Run all tool tasks in parallel
+    with tracer.start_as_current_span(
+        'running tools',
+        attributes={
+            'tools': [call.tool_name for call in tool_calls],
+            'logfire.msg': f'running {len(tool_calls)} tool{"" if len(tool_calls) == 1 else "s"}',
+        },
+    ):
+        tasks = [
+            asyncio.create_task(
+                _call_tool(tool_manager, call, deferred_tool_results.get(call.tool_call_id), usage_limits),
+                name=call.tool_name,
             )
+            for call in tool_calls
+        ]
+
+        pending = tasks
+        while pending:
+            done, pending = await asyncio.wait(pending, return_when=asyncio.FIRST_COMPLETED)
+            for task in done:
+                index = tasks.index(task)
+                try:
+                    tool_part, tool_user_part = task.result()
+                except exceptions.CallDeferred:
+                    deferred_calls_by_index[index] = 'external'
+                except exceptions.ApprovalRequired:
+                    deferred_calls_by_index[index] = 'unapproved'
+                else:
+                    yield _messages.FunctionToolResultEvent(tool_part)
 
-        tool_part.content = tool_result.return_value  # type: ignore
-        tool_part.metadata = tool_result.metadata
-        if tool_result.content:
-            user_parts.append(
-                _messages.UserPromptPart(
-                    content=tool_result.content,
-                    part_kind='user-prompt',
-                )
+                    tool_parts_by_index[index] = tool_part
+                    if tool_user_part:
+                        user_parts_by_index[index] = tool_user_part
+
+    # We append the results at the end, rather than as they are received, to retain a consistent ordering
+    # This is mostly just to simplify testing
+    for k in sorted(tool_parts_by_index):
+        output_parts.append(tool_parts_by_index[k])
+
+    for k in sorted(user_parts_by_index):
+        output_parts.append(user_parts_by_index[k])
+
+    for k in sorted(deferred_calls_by_index):
+        output_deferred_calls[deferred_calls_by_index[k]].append(tool_calls[k])
+
+
+async def _call_tool(
+    tool_manager: ToolManager[DepsT],
+    tool_call: _messages.ToolCallPart,
+    tool_call_result: DeferredToolResult | None,
+    usage_limits: _usage.UsageLimits | None,
+) -> tuple[_messages.ToolReturnPart | _messages.RetryPromptPart, _messages.UserPromptPart | None]:
+    try:
+        if tool_call_result is None:
+            tool_result = await tool_manager.handle_call(tool_call, usage_limits=usage_limits)
+        elif isinstance(tool_call_result, ToolApproved):
+            if tool_call_result.override_args is not None:
+                tool_call = dataclasses.replace(tool_call, args=tool_call_result.override_args)
+            tool_result = await tool_manager.handle_call(tool_call, usage_limits=usage_limits)
+        elif isinstance(tool_call_result, ToolDenied):
+            return _messages.ToolReturnPart(
+                tool_name=tool_call.tool_name,
+                content=tool_call_result.message,
+                tool_call_id=tool_call.tool_call_id,
+            ), None
+        elif isinstance(tool_call_result, exceptions.ModelRetry):
+            m = _messages.RetryPromptPart(
+                content=tool_call_result.message,
+                tool_name=tool_call.tool_name,
+                tool_call_id=tool_call.tool_call_id,
             )
+            raise ToolRetryError(m)
+        elif isinstance(tool_call_result, _messages.RetryPromptPart):
+            tool_call_result.tool_name = tool_call.tool_name
+            tool_call_result.tool_call_id = tool_call.tool_call_id
+            raise ToolRetryError(tool_call_result)
+        else:
+            tool_result = tool_call_result
+    except ToolRetryError as e:
+        return e.tool_retry, None
+
+    if isinstance(tool_result, _messages.ToolReturn):
+        tool_return = tool_result
     else:
+        result_is_list = isinstance(tool_result, list)
+        contents = cast(list[Any], tool_result) if result_is_list else [tool_result]
 
-        def process_content(content: Any) -> Any:
+        return_values: list[Any] = []
+        user_contents: list[str | _messages.UserContent] = []
+        for content in contents:
             if isinstance(content, _messages.ToolReturn):
                 raise exceptions.UserError(
                     f'The return value of tool {tool_call.tool_name!r} contains invalid nested `ToolReturn` objects. '
                     f'`ToolReturn` should be used directly.'
                 )
-            elif isinstance(content, _messages.MultiModalContentTypes):
-                if isinstance(content, _messages.BinaryContent):
-                    identifier = content.identifier or multi_modal_content_identifier(content.data)
-                else:
-                    identifier = multi_modal_content_identifier(content.url)
+            elif isinstance(content, _messages.MultiModalContent):
+                identifier = content.identifier
 
-                user_parts.append(
-                    _messages.UserPromptPart(
-                        content=[f'This is file {identifier}:', content],
-                        part_kind='user-prompt',
-                    )
-                )
-                return f'See file {identifier}'
+                return_values.append(f'See file {identifier}')
+                user_contents.extend([f'This is file {identifier}:', content])
+            else:
+                return_values.append(content)
 
-            return content
+        tool_return = _messages.ToolReturn(
+            return_value=return_values[0] if len(return_values) == 1 and not result_is_list else return_values,
+            content=user_contents,
+        )
 
-    if isinstance(tool_result, list):
-        contents = cast(list[Any], tool_result)
-        tool_part.content = [process_content(content) for content in contents]
-    else:
-        tool_part.content = process_content(tool_result)
+    if (
+        isinstance(tool_return.return_value, _messages.MultiModalContent)
+        or isinstance(tool_return.return_value, list)
+        and any(
+            isinstance(content, _messages.MultiModalContent)
+            for content in tool_return.return_value  # type: ignore
+        )
+    ):
+        raise exceptions.UserError(
+            f'The `return_value` of tool {tool_call.tool_name!r} contains invalid nested `MultiModalContent` objects. '
+            f'Please use `content` instead.'
+        )
+
+    return_part = _messages.ToolReturnPart(
+        tool_name=tool_call.tool_name,
+        tool_call_id=tool_call.tool_call_id,
+        content=tool_return.return_value,  # type: ignore
+        metadata=tool_return.metadata,
+    )
+
+    user_part: _messages.UserPromptPart | None = None
+    if tool_return.content:
+        user_part = _messages.UserPromptPart(
+            content=tool_return.content,
+            part_kind='user-prompt',
+        )
 
-    return (tool_part, user_parts)
+    return return_part, user_part
 
 
 @dataclasses.dataclass
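For reference, the task loop in `_call_tools` above turns two new exceptions into deferred-call buckets: `exceptions.CallDeferred` marks a call as `external` and `exceptions.ApprovalRequired` as `unapproved`, and `build_run_context` sets `tool_call_approved` on the run context when results are supplied on run step zero. A minimal, hypothetical tool using that approval path — the decorator and model name are illustrative; only the exception name and the `tool_call_approved` field come from this diff:

    from pydantic_ai import Agent, RunContext
    from pydantic_ai.exceptions import ApprovalRequired  # raised by tools, caught in _call_tools

    agent = Agent('openai:gpt-5')

    @agent.tool
    def delete_file(ctx: RunContext[None], path: str) -> str:
        # On the first pass this raises, so the call surfaces in
        # DeferredToolRequests.approvals; once the run is resumed with a
        # ToolApproved result, tool_call_approved is True and the tool executes.
        if not ctx.tool_call_approved:
            raise ApprovalRequired
        return f'{path} deleted'  # actual deletion elided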