prompture 0.0.35__py3-none-any.whl → 0.0.40.dev1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (52)
  1. prompture/__init__.py +132 -3
  2. prompture/_version.py +2 -2
  3. prompture/agent.py +924 -0
  4. prompture/agent_types.py +156 -0
  5. prompture/async_agent.py +880 -0
  6. prompture/async_conversation.py +208 -17
  7. prompture/async_core.py +16 -0
  8. prompture/async_driver.py +63 -0
  9. prompture/async_groups.py +551 -0
  10. prompture/conversation.py +222 -18
  11. prompture/core.py +46 -12
  12. prompture/cost_mixin.py +37 -0
  13. prompture/discovery.py +132 -44
  14. prompture/driver.py +77 -0
  15. prompture/drivers/__init__.py +5 -1
  16. prompture/drivers/async_azure_driver.py +11 -5
  17. prompture/drivers/async_claude_driver.py +184 -9
  18. prompture/drivers/async_google_driver.py +222 -28
  19. prompture/drivers/async_grok_driver.py +11 -5
  20. prompture/drivers/async_groq_driver.py +11 -5
  21. prompture/drivers/async_lmstudio_driver.py +74 -5
  22. prompture/drivers/async_ollama_driver.py +13 -3
  23. prompture/drivers/async_openai_driver.py +162 -5
  24. prompture/drivers/async_openrouter_driver.py +11 -5
  25. prompture/drivers/async_registry.py +5 -1
  26. prompture/drivers/azure_driver.py +10 -4
  27. prompture/drivers/claude_driver.py +17 -1
  28. prompture/drivers/google_driver.py +227 -33
  29. prompture/drivers/grok_driver.py +11 -5
  30. prompture/drivers/groq_driver.py +11 -5
  31. prompture/drivers/lmstudio_driver.py +73 -8
  32. prompture/drivers/ollama_driver.py +16 -5
  33. prompture/drivers/openai_driver.py +26 -11
  34. prompture/drivers/openrouter_driver.py +11 -5
  35. prompture/drivers/vision_helpers.py +153 -0
  36. prompture/group_types.py +147 -0
  37. prompture/groups.py +530 -0
  38. prompture/image.py +180 -0
  39. prompture/ledger.py +252 -0
  40. prompture/model_rates.py +112 -2
  41. prompture/persistence.py +254 -0
  42. prompture/persona.py +482 -0
  43. prompture/serialization.py +218 -0
  44. prompture/settings.py +1 -0
  45. prompture-0.0.40.dev1.dist-info/METADATA +369 -0
  46. prompture-0.0.40.dev1.dist-info/RECORD +78 -0
  47. prompture-0.0.35.dist-info/METADATA +0 -464
  48. prompture-0.0.35.dist-info/RECORD +0 -66
  49. {prompture-0.0.35.dist-info → prompture-0.0.40.dev1.dist-info}/WHEEL +0 -0
  50. {prompture-0.0.35.dist-info → prompture-0.0.40.dev1.dist-info}/entry_points.txt +0 -0
  51. {prompture-0.0.35.dist-info → prompture-0.0.40.dev1.dist-info}/licenses/LICENSE +0 -0
  52. {prompture-0.0.35.dist-info → prompture-0.0.40.dev1.dist-info}/top_level.txt +0 -0
prompture/agent.py ADDED
@@ -0,0 +1,924 @@
1
+ """Agent framework for Prompture.
2
+
3
+ Provides a reusable :class:`Agent` that wraps a ReAct-style loop around
4
+ :class:`~prompture.conversation.Conversation`, with optional structured
5
+ output via Pydantic models and tool support via :class:`ToolRegistry`.
6
+
7
+ Example::
8
+
9
+ from prompture import Agent
10
+
11
+ agent = Agent("openai/gpt-4o", system_prompt="You are a helpful assistant.")
12
+ result = agent.run("What is the capital of France?")
13
+ print(result.output)
14
+ """
15
+
16
+ from __future__ import annotations
17
+
18
+ import inspect
19
+ import json
20
+ import logging
21
+ import time
22
+ import typing
23
+ from collections.abc import Callable, Generator, Iterator
24
+ from typing import Any, Generic
25
+
26
+ from pydantic import BaseModel
27
+
28
+ from .agent_types import (
29
+ AgentCallbacks,
30
+ AgentResult,
31
+ AgentState,
32
+ AgentStep,
33
+ DepsType,
34
+ ModelRetry,
35
+ RunContext,
36
+ StepType,
37
+ StreamEvent,
38
+ StreamEventType,
39
+ )
40
+ from .callbacks import DriverCallbacks
41
+ from .conversation import Conversation
42
+ from .driver import Driver
43
+ from .persona import Persona
44
+ from .session import UsageSession
45
+ from .tools import clean_json_text
46
+ from .tools_schema import ToolDefinition, ToolRegistry
47
+
48
+ logger = logging.getLogger("prompture.agent")
49
+
50
+ _OUTPUT_PARSE_MAX_RETRIES = 3
51
+ _OUTPUT_GUARDRAIL_MAX_RETRIES = 3
52
+
53
+
54
+ # ------------------------------------------------------------------
55
+ # Module-level helpers for RunContext injection
56
+ # ------------------------------------------------------------------
57
+
58
+
59
+ def _tool_wants_context(fn: Callable[..., Any]) -> bool:
60
+ """Check whether *fn*'s first parameter is annotated as :class:`RunContext`.
61
+
62
+ Uses :func:`typing.get_type_hints` to resolve string annotations
63
+ (from ``from __future__ import annotations``). Falls back to raw
64
+ ``__annotations__`` when ``get_type_hints`` cannot resolve local types.
65
+ """
66
+ sig = inspect.signature(fn)
67
+ params = list(sig.parameters.keys())
68
+ if not params:
69
+ return False
70
+
71
+ first_param = params[0]
72
+ if first_param == "self":
73
+ if len(params) < 2:
74
+ return False
75
+ first_param = params[1]
76
+
77
+ # Try get_type_hints first (resolves string annotations)
78
+ annotation = None
79
+ try:
80
+ hints = typing.get_type_hints(fn, include_extras=True)
81
+ annotation = hints.get(first_param)
82
+ except Exception:
83
+ # get_type_hints can fail with local/forward references; fall back to raw annotation
84
+ pass
85
+
86
+ # Fallback: inspect raw annotation (may be a string)
87
+ if annotation is None:
88
+ raw = sig.parameters[first_param].annotation
89
+ if raw is inspect.Parameter.empty:
90
+ return False
91
+ annotation = raw
92
+
93
+ # String annotation: check if it starts with "RunContext"
94
+ if isinstance(annotation, str):
95
+ return annotation == "RunContext" or annotation.startswith("RunContext[")
96
+
97
+ # Direct match
98
+ if annotation is RunContext:
99
+ return True
100
+
101
+ # Generic alias: RunContext[X]
102
+ origin = getattr(annotation, "__origin__", None)
103
+ return origin is RunContext
104
+
105
+
106
+ def _get_first_param_name(fn: Callable[..., Any]) -> str:
107
+ """Return the name of the first non-self parameter of *fn*."""
108
+ sig = inspect.signature(fn)
109
+ for name, _param in sig.parameters.items():
110
+ if name != "self":
111
+ return name
112
+ return ""
113
+
114
+
115
+ # ------------------------------------------------------------------
116
+ # Agent
117
+ # ------------------------------------------------------------------
118
+
119
+
120
class Agent(Generic[DepsType]):
    """Reusable ReAct-style agent template with tools and optional typed output.

    An Agent holds configuration only — model, tools, prompts, budgets.
    Every :meth:`run` creates a brand-new
    :class:`~prompture.conversation.Conversation`, so no state leaks from
    one run into the next.

    Args:
        model: Model string in ``"provider/model"`` format.
        driver: Pre-built driver instance (useful for testing).
        tools: Initial tools as a list of callables or a
            :class:`ToolRegistry`.
        system_prompt: System prompt prepended to every run. May also
            be a :class:`Persona` or a callable ``(RunContext) -> str``
            for dynamic prompts.
        output_type: Optional Pydantic model class. When set, the
            final LLM response is parsed and validated against this type.
        max_iterations: Maximum tool-use rounds per run.
        max_cost: Soft budget in USD. When exceeded, output parse and
            guardrail retries are skipped.
        options: Extra driver options forwarded to every call.
        deps_type: Type hint for dependencies (for docs/IDE only).
        agent_callbacks: Agent-level observability callbacks.
        input_guardrails: Functions called before the prompt is sent.
        output_guardrails: Functions called after output is parsed.
        name: Optional agent name (used as the default tool name by
            :meth:`as_tool`).
        description: Optional human-readable description.
        output_key: Optional output key (consumer-defined; not read
            within this module).
    """

    def __init__(
        self,
        model: str = "",
        *,
        driver: Driver | None = None,
        tools: list[Callable[..., Any]] | ToolRegistry | None = None,
        system_prompt: str | Persona | Callable[..., str] | None = None,
        output_type: type[BaseModel] | None = None,
        max_iterations: int = 10,
        max_cost: float | None = None,
        options: dict[str, Any] | None = None,
        deps_type: type | None = None,
        agent_callbacks: AgentCallbacks | None = None,
        input_guardrails: list[Callable[..., Any]] | None = None,
        output_guardrails: list[Callable[..., Any]] | None = None,
        name: str = "",
        description: str = "",
        output_key: str | None = None,
    ) -> None:
        if not model and driver is None:
            raise ValueError("Either model or driver must be provided")

        # Identity / metadata.
        self.name = name
        self.description = description
        self.output_key = output_key

        # Core configuration (copies taken so callers can reuse their dicts/lists).
        self._model = model
        self._driver = driver
        self._system_prompt = system_prompt
        self._output_type = output_type
        self._max_iterations = max_iterations
        self._max_cost = max_cost
        self._options = dict(options) if options else {}
        self._deps_type = deps_type

        # Hooks.
        self._agent_callbacks = agent_callbacks or AgentCallbacks()
        self._input_guardrails = list(input_guardrails or [])
        self._output_guardrails = list(output_guardrails or [])

        # Tool registry: adopt a ready-made one, or register callables one by one.
        if isinstance(tools, ToolRegistry):
            registry = tools
        else:
            registry = ToolRegistry()
            for fn in tools or []:
                registry.register(fn)
        self._tools = registry

        # Lifecycle flags.
        self._state = AgentState.idle
        self._stop_requested = False
193
+
194
+ # ------------------------------------------------------------------
195
+ # Public API
196
+ # ------------------------------------------------------------------
197
+
198
+ def tool(self, fn: Callable[..., Any]) -> Callable[..., Any]:
199
+ """Decorator to register a function as a tool on this agent.
200
+
201
+ Returns the original function unchanged.
202
+ """
203
+ self._tools.register(fn)
204
+ return fn
205
+
206
    @property
    def state(self) -> AgentState:
        """Current lifecycle state of the agent (idle, running, or errored)."""
        return self._state
210
+
211
    def stop(self) -> None:
        """Request graceful shutdown after the current iteration.

        Only sets a flag; it does not interrupt an in-flight model call.
        NOTE(review): no visible code path in this module reads
        ``_stop_requested`` back — confirm the flag is honored elsewhere.
        """
        self._stop_requested = True
214
+
215
+ def as_tool(
216
+ self,
217
+ name: str | None = None,
218
+ description: str | None = None,
219
+ custom_output_extractor: Callable[[AgentResult], str] | None = None,
220
+ ) -> ToolDefinition:
221
+ """Wrap this Agent as a callable tool for another Agent.
222
+
223
+ Creates a :class:`ToolDefinition` whose function accepts a ``prompt``
224
+ string, runs this agent, and returns the output text.
225
+
226
+ Args:
227
+ name: Tool name (defaults to ``self.name`` or ``"agent_tool"``).
228
+ description: Tool description (defaults to ``self.description``).
229
+ custom_output_extractor: Optional function to extract a string
230
+ from :class:`AgentResult`. Defaults to ``result.output_text``.
231
+ """
232
+ tool_name = name or self.name or "agent_tool"
233
+ tool_desc = description or self.description or f"Run agent {tool_name}"
234
+ agent = self
235
+ extractor = custom_output_extractor
236
+
237
+ def _call_agent(prompt: str) -> str:
238
+ """Run the wrapped agent with the given prompt."""
239
+ result = agent.run(prompt)
240
+ if extractor is not None:
241
+ return extractor(result)
242
+ return result.output_text
243
+
244
+ return ToolDefinition(
245
+ name=tool_name,
246
+ description=tool_desc,
247
+ parameters={
248
+ "type": "object",
249
+ "properties": {
250
+ "prompt": {"type": "string", "description": "The prompt to send to the agent"},
251
+ },
252
+ "required": ["prompt"],
253
+ },
254
+ function=_call_agent,
255
+ )
256
+
257
+ def run(self, prompt: str, *, deps: Any = None) -> AgentResult:
258
+ """Execute the agent loop to completion.
259
+
260
+ Creates a fresh :class:`Conversation`, sends the prompt,
261
+ handles any tool calls, and optionally parses the final
262
+ response into an ``output_type`` Pydantic model.
263
+
264
+ Args:
265
+ prompt: The user prompt to send.
266
+ deps: Optional dependencies injected into :class:`RunContext`.
267
+ """
268
+ self._state = AgentState.running
269
+ self._stop_requested = False
270
+ steps: list[AgentStep] = []
271
+
272
+ try:
273
+ result = self._execute(prompt, steps, deps)
274
+ self._state = AgentState.idle
275
+ return result
276
+ except Exception:
277
+ self._state = AgentState.errored
278
+ raise
279
+
280
+ # ------------------------------------------------------------------
281
+ # RunContext helpers
282
+ # ------------------------------------------------------------------
283
+
284
+ def _build_run_context(
285
+ self,
286
+ prompt: str,
287
+ deps: Any,
288
+ session: UsageSession,
289
+ messages: list[dict[str, Any]],
290
+ iteration: int,
291
+ ) -> RunContext[Any]:
292
+ """Create a :class:`RunContext` snapshot for the current run."""
293
+ return RunContext(
294
+ deps=deps,
295
+ model=self._model,
296
+ usage=session.summary(),
297
+ messages=list(messages),
298
+ iteration=iteration,
299
+ prompt=prompt,
300
+ )
301
+
302
+ # ------------------------------------------------------------------
303
+ # Tool wrapping (RunContext injection + ModelRetry + callbacks)
304
+ # ------------------------------------------------------------------
305
+
306
    def _wrap_tools_with_context(self, ctx: RunContext[Any]) -> ToolRegistry:
        """Return a new :class:`ToolRegistry` with wrapped tool functions.

        For each registered tool:
        - If the tool's first param is ``RunContext``, inject *ctx* automatically.
        - Catch :class:`ModelRetry` and convert to an error string.
        - Fire ``agent_callbacks.on_tool_start`` / ``on_tool_end``.
        - Strip the ``RunContext`` parameter from the JSON schema sent to the LLM.
        """
        if not self._tools:
            return ToolRegistry()

        new_registry = ToolRegistry()

        cb = self._agent_callbacks

        for td in self._tools.definitions:
            wants_ctx = _tool_wants_context(td.function)
            original_fn = td.function
            tool_name = td.name

            # Factory so each wrapper closes over this iteration's tool:
            # binding via parameters avoids the late-binding closure pitfall.
            def _make_wrapper(
                _fn: Callable[..., Any],
                _wants: bool,
                _name: str,
                _cb: AgentCallbacks = cb,
            ) -> Callable[..., Any]:
                def wrapper(**kwargs: Any) -> Any:
                    if _cb.on_tool_start:
                        _cb.on_tool_start(_name, kwargs)
                    try:
                        if _wants:
                            # Inject the RunContext as the first positional arg.
                            result = _fn(ctx, **kwargs)
                        else:
                            result = _fn(**kwargs)
                    except ModelRetry as exc:
                        # Surface the retry request to the LLM as tool output
                        # instead of propagating the exception.
                        result = f"Error: {exc.message}"
                    if _cb.on_tool_end:
                        _cb.on_tool_end(_name, result)
                    return result

                return wrapper

            wrapped = _make_wrapper(original_fn, wants_ctx, tool_name)

            # Build schema: strip RunContext param if present
            params = dict(td.parameters)
            if wants_ctx:
                ctx_param_name = _get_first_param_name(td.function)
                props = dict(params.get("properties", {}))
                props.pop(ctx_param_name, None)
                params = dict(params)
                params["properties"] = props
                req = list(params.get("required", []))
                if ctx_param_name in req:
                    req.remove(ctx_param_name)
                if req:
                    params["required"] = req
                elif "required" in params:
                    # Drop an emptied 'required' list entirely.
                    del params["required"]

            new_td = ToolDefinition(
                name=td.name,
                description=td.description,
                parameters=params,
                function=wrapped,
            )
            new_registry.add(new_td)

        return new_registry
376
+
377
+ # ------------------------------------------------------------------
378
+ # Guardrails
379
+ # ------------------------------------------------------------------
380
+
381
+ def _run_input_guardrails(self, ctx: RunContext[Any], prompt: str) -> str:
382
+ """Execute input guardrails in order. Returns the (possibly transformed) prompt.
383
+
384
+ Each guardrail receives ``(ctx, prompt)`` and may:
385
+ - Return a ``str`` to transform the prompt.
386
+ - Return ``None`` to leave it unchanged.
387
+ - Raise :class:`GuardrailError` to reject entirely.
388
+ """
389
+ for guardrail in self._input_guardrails:
390
+ result = guardrail(ctx, prompt)
391
+ if result is not None:
392
+ prompt = result
393
+ return prompt
394
+
395
    def _run_output_guardrails(
        self,
        ctx: RunContext[Any],
        result: AgentResult,
        conv: Conversation,
        session: UsageSession,
        steps: list[AgentStep],
        all_tool_calls: list[dict[str, Any]],
    ) -> AgentResult:
        """Execute output guardrails. Returns the (possibly modified) result.

        Each guardrail receives ``(ctx, result)`` and may:
        - Return ``None`` to pass (no change).
        - Return an :class:`AgentResult` to modify the result.
        - Raise :class:`ModelRetry` to re-prompt the LLM (up to 3 retries).

        Args:
            ctx: Run context passed to each guardrail.
            result: Result produced by the main execution path.
            conv: Live conversation, used to re-prompt on :class:`ModelRetry`.
            session: Usage session, consulted for the cost budget.
            steps: Mutable step list extended with retry exchanges.
            all_tool_calls: Mutable tool-call list extended alongside *steps*.

        Raises:
            ValueError: When a guardrail still raises after all retries.
        """
        for guardrail in self._output_guardrails:
            for attempt in range(_OUTPUT_GUARDRAIL_MAX_RETRIES):
                try:
                    guard_result = guardrail(ctx, result)
                    if guard_result is not None:
                        result = guard_result
                    break  # guardrail passed
                except ModelRetry as exc:
                    if self._is_over_budget(session):
                        # Budget exhausted: keep the current result as-is.
                        logger.debug("Over budget, skipping output guardrail retry")
                        break
                    if attempt >= _OUTPUT_GUARDRAIL_MAX_RETRIES - 1:
                        raise ValueError(
                            f"Output guardrail failed after {_OUTPUT_GUARDRAIL_MAX_RETRIES} retries: {exc.message}"
                        ) from exc
                    # Re-prompt the LLM
                    retry_text = conv.ask(
                        f"Your response did not pass validation. Error: {exc.message}\n\nPlease try again."
                    )
                    # Record the retry exchange (last user + assistant messages).
                    self._extract_steps(conv.messages[-2:], steps, all_tool_calls)

                    # Re-parse if output_type is set
                    if self._output_type is not None:
                        try:
                            cleaned = clean_json_text(retry_text)
                            parsed = json.loads(cleaned)
                            output = self._output_type.model_validate(parsed)
                        except Exception:
                            # Parse failure here is non-fatal; fall back to raw text
                            # and let the guardrail judge it on the next attempt.
                            output = retry_text
                    else:
                        output = retry_text

                    result = AgentResult(
                        output=output,
                        output_text=retry_text,
                        messages=conv.messages,
                        usage=conv.usage,
                        steps=steps,
                        all_tool_calls=all_tool_calls,
                        state=AgentState.idle,
                        run_usage=session.summary(),
                    )
        return result
454
+
455
+ # ------------------------------------------------------------------
456
+ # Budget check
457
+ # ------------------------------------------------------------------
458
+
459
+ def _is_over_budget(self, session: UsageSession) -> bool:
460
+ """Return True if max_cost is set and the session has exceeded it."""
461
+ if self._max_cost is None:
462
+ return False
463
+ return session.total_cost >= self._max_cost
464
+
465
+ # ------------------------------------------------------------------
466
+ # Internals
467
+ # ------------------------------------------------------------------
468
+
469
+ def _resolve_system_prompt(self, ctx: RunContext[Any] | None = None) -> str | None:
470
+ """Build the system prompt, appending output schema if needed."""
471
+ parts: list[str] = []
472
+
473
+ if self._system_prompt is not None:
474
+ if isinstance(self._system_prompt, Persona):
475
+ # Render Persona with RunContext variables if available
476
+ render_kwargs: dict[str, Any] = {}
477
+ if ctx is not None:
478
+ render_kwargs["model"] = ctx.model
479
+ render_kwargs["iteration"] = ctx.iteration
480
+ parts.append(self._system_prompt.render(**render_kwargs))
481
+ elif callable(self._system_prompt) and not isinstance(self._system_prompt, str):
482
+ if ctx is not None:
483
+ parts.append(self._system_prompt(ctx))
484
+ else:
485
+ # Fallback: call without context (shouldn't happen in normal flow)
486
+ parts.append(self._system_prompt(None)) # type: ignore[arg-type]
487
+ else:
488
+ parts.append(str(self._system_prompt))
489
+
490
+ if self._output_type is not None:
491
+ schema = self._output_type.model_json_schema()
492
+ schema_str = json.dumps(schema, indent=2)
493
+ parts.append(
494
+ "You MUST respond with a single JSON object (no markdown, "
495
+ "no extra text) that validates against this JSON schema:\n"
496
+ f"{schema_str}\n\n"
497
+ "Use double quotes for keys and strings. "
498
+ "If a value is unknown use null."
499
+ )
500
+
501
+ return "\n\n".join(parts) if parts else None
502
+
503
+ def _build_conversation(
504
+ self,
505
+ system_prompt: str | None = None,
506
+ tools: ToolRegistry | None = None,
507
+ driver_callbacks: DriverCallbacks | None = None,
508
+ ) -> Conversation:
509
+ """Create a fresh Conversation for a single run."""
510
+ effective_tools = tools if tools is not None else (self._tools if self._tools else None)
511
+
512
+ kwargs: dict[str, Any] = {
513
+ "system_prompt": system_prompt if system_prompt is not None else self._resolve_system_prompt(),
514
+ "tools": effective_tools,
515
+ "max_tool_rounds": self._max_iterations,
516
+ }
517
+ if self._options:
518
+ kwargs["options"] = self._options
519
+ if driver_callbacks is not None:
520
+ kwargs["callbacks"] = driver_callbacks
521
+
522
+ if self._driver is not None:
523
+ kwargs["driver"] = self._driver
524
+ else:
525
+ kwargs["model_name"] = self._model
526
+
527
+ return Conversation(**kwargs)
528
+
529
    def _execute(self, prompt: str, steps: list[AgentStep], deps: Any) -> AgentResult:
        """Core execution: run conversation, extract steps, parse output.

        Args:
            prompt: Raw user prompt (input guardrails may transform it).
            steps: Mutable list populated in place with the run's steps.
            deps: Caller-supplied dependencies exposed via :class:`RunContext`.

        Returns:
            The fully assembled :class:`AgentResult`.

        Raises:
            ValueError: Propagated from output parsing or guardrail retries.
        """
        # 1. Create per-run UsageSession and wire into DriverCallbacks
        session = UsageSession()
        driver_callbacks = DriverCallbacks(
            on_response=session.record,
            on_error=session.record_error,
        )

        # 2. Build initial RunContext (no messages yet, iteration 0)
        ctx = self._build_run_context(prompt, deps, session, [], 0)

        # 3. Run input guardrails
        effective_prompt = self._run_input_guardrails(ctx, prompt)

        # 4. Resolve system prompt (call it if callable, passing ctx)
        resolved_system_prompt = self._resolve_system_prompt(ctx)

        # 5. Wrap tools with context
        wrapped_tools = self._wrap_tools_with_context(ctx)

        # 6. Build Conversation
        conv = self._build_conversation(
            system_prompt=resolved_system_prompt,
            tools=wrapped_tools if wrapped_tools else None,
            driver_callbacks=driver_callbacks,
        )

        # 7. Fire on_iteration callback
        if self._agent_callbacks.on_iteration:
            self._agent_callbacks.on_iteration(0)

        # 8. Ask the conversation (handles full tool loop internally)
        t0 = time.perf_counter()
        response_text = conv.ask(effective_prompt)
        elapsed_ms = (time.perf_counter() - t0) * 1000

        # 9. Extract steps and tool calls from conversation messages
        all_tool_calls: list[dict[str, Any]] = []
        self._extract_steps(conv.messages, steps, all_tool_calls)

        # Handle output_type parsing
        if self._output_type is not None:
            output, output_text = self._parse_output(conv, response_text, steps, all_tool_calls, elapsed_ms, session)
        else:
            output = response_text
            output_text = response_text

        # Build result with run_usage
        result = AgentResult(
            output=output,
            output_text=output_text,
            messages=conv.messages,
            usage=conv.usage,
            steps=steps,
            all_tool_calls=all_tool_calls,
            state=AgentState.idle,
            run_usage=session.summary(),
        )

        # 10. Run output guardrails (may re-prompt and replace the result)
        if self._output_guardrails:
            result = self._run_output_guardrails(ctx, result, conv, session, steps, all_tool_calls)

        # 11. Fire callbacks
        if self._agent_callbacks.on_step:
            for step in steps:
                self._agent_callbacks.on_step(step)

        if self._agent_callbacks.on_output:
            self._agent_callbacks.on_output(result)

        return result
602
+
603
    def _extract_steps(
        self,
        messages: list[dict[str, Any]],
        steps: list[AgentStep],
        all_tool_calls: list[dict[str, Any]],
    ) -> None:
        """Scan conversation messages and populate steps and tool_calls.

        Args:
            messages: Conversation messages as role-keyed dicts.
            steps: Mutable list extended in place with :class:`AgentStep`s.
            all_tool_calls: Mutable list extended with
                ``{"name", "arguments", "id"}`` dicts, one per tool call.
        """
        # All steps from one scan share a single timestamp; per-message
        # timing cannot be reconstructed from the transcript.
        now = time.time()

        for msg in messages:
            role = msg.get("role", "")

            if role == "assistant":
                tc_list = msg.get("tool_calls", [])
                if tc_list:
                    # Assistant message with tool calls
                    for tc in tc_list:
                        # Accept both nested ("function": {...}) and flat layouts.
                        fn = tc.get("function", {})
                        name = fn.get("name", tc.get("name", ""))
                        raw_args = fn.get("arguments", tc.get("arguments", "{}"))
                        if isinstance(raw_args, str):
                            try:
                                args = json.loads(raw_args)
                            except json.JSONDecodeError:
                                # Malformed argument JSON degrades to an empty dict.
                                args = {}
                        else:
                            args = raw_args

                        steps.append(
                            AgentStep(
                                step_type=StepType.tool_call,
                                timestamp=now,
                                content=msg.get("content", ""),
                                tool_name=name,
                                tool_args=args,
                            )
                        )
                        all_tool_calls.append({"name": name, "arguments": args, "id": tc.get("id", "")})
                else:
                    # Final assistant message (no tool calls)
                    steps.append(
                        AgentStep(
                            step_type=StepType.output,
                            timestamp=now,
                            content=msg.get("content", ""),
                        )
                    )

            elif role == "tool":
                steps.append(
                    AgentStep(
                        step_type=StepType.tool_result,
                        timestamp=now,
                        content=msg.get("content", ""),
                        # NOTE(review): this stores the message's tool_call_id in
                        # the tool_name field — confirm that is intentional.
                        tool_name=msg.get("tool_call_id"),
                    )
                )
660
+
661
    def _parse_output(
        self,
        conv: Conversation,
        response_text: str,
        steps: list[AgentStep],
        all_tool_calls: list[dict[str, Any]],
        elapsed_ms: float,
        session: UsageSession | None = None,
    ) -> tuple[Any, str]:
        """Try to parse ``response_text`` as the output_type, with retries.

        Args:
            conv: Live conversation used to re-prompt on parse failure.
            response_text: Candidate final response from the model.
            steps: Mutable step list extended with any retry exchanges.
            all_tool_calls: Mutable tool-call list extended alongside *steps*.
            elapsed_ms: Duration of the initial ask. NOTE(review): currently
                unused inside this method.
            session: Optional usage session consulted for the cost budget.

        Returns:
            ``(validated_model_instance, raw_text)`` on success.

        Raises:
            ValueError: When parsing fails after all retries (or after the
                budget check cuts retries short).
        """
        assert self._output_type is not None

        last_error: Exception | None = None
        text = response_text

        for attempt in range(_OUTPUT_PARSE_MAX_RETRIES):
            try:
                cleaned = clean_json_text(text)
                parsed = json.loads(cleaned)
                model_instance = self._output_type.model_validate(parsed)
                return model_instance, text
            except Exception as exc:
                last_error = exc
                if attempt < _OUTPUT_PARSE_MAX_RETRIES - 1:
                    # Check budget before retrying
                    if session is not None and self._is_over_budget(session):
                        logger.debug("Over budget, skipping output parse retry")
                        break
                    logger.debug("Output parse attempt %d failed: %s", attempt + 1, exc)
                    retry_msg = (
                        f"Your previous response could not be parsed as valid JSON "
                        f"matching the required schema. Error: {exc}\n\n"
                        f"Please try again and respond ONLY with valid JSON."
                    )
                    text = conv.ask(retry_msg)

                    # Record the retry step
                    self._extract_steps(conv.messages[-2:], steps, all_tool_calls)

        # NOTE(review): when the budget break fires, fewer than
        # _OUTPUT_PARSE_MAX_RETRIES attempts were made, but the message
        # below still reports the full count.
        raise ValueError(
            f"Failed to parse output as {self._output_type.__name__} "
            f"after {_OUTPUT_PARSE_MAX_RETRIES} attempts: {last_error}"
        )
704
+
705
+ # ------------------------------------------------------------------
706
+ # iter() — step-by-step inspection
707
+ # ------------------------------------------------------------------
708
+
709
+ def iter(self, prompt: str, *, deps: Any = None) -> AgentIterator:
710
+ """Execute the agent loop and iterate over steps.
711
+
712
+ Returns an :class:`AgentIterator` that yields :class:`AgentStep`
713
+ objects. After iteration completes, the final :class:`AgentResult`
714
+ is available via :attr:`AgentIterator.result`.
715
+
716
+ Note:
717
+ In Phase 3c the conversation's tool loop runs to completion
718
+ before steps are yielded. True mid-loop yielding is deferred.
719
+ """
720
+ gen = self._execute_iter(prompt, deps)
721
+ return AgentIterator(gen)
722
+
723
+ def _execute_iter(self, prompt: str, deps: Any) -> Generator[AgentStep, None, AgentResult]:
724
+ """Generator that executes the agent loop and yields each step."""
725
+ self._state = AgentState.running
726
+ self._stop_requested = False
727
+ steps: list[AgentStep] = []
728
+
729
+ try:
730
+ result = self._execute(prompt, steps, deps)
731
+ # Yield each step one at a time
732
+ yield from result.steps
733
+ self._state = AgentState.idle
734
+ return result
735
+ except Exception:
736
+ self._state = AgentState.errored
737
+ raise
738
+
739
+ # ------------------------------------------------------------------
740
+ # run_stream() — streaming output
741
+ # ------------------------------------------------------------------
742
+
743
+ def run_stream(self, prompt: str, *, deps: Any = None) -> StreamedAgentResult:
744
+ """Execute the agent loop with streaming output.
745
+
746
+ Returns a :class:`StreamedAgentResult` that yields
747
+ :class:`StreamEvent` objects. After iteration completes, the
748
+ final :class:`AgentResult` is available via
749
+ :attr:`StreamedAgentResult.result`.
750
+
751
+ When tools are registered, streaming falls back to non-streaming
752
+ ``conv.ask()`` and yields the full response as a single
753
+ ``text_delta`` event.
754
+ """
755
+ gen = self._execute_stream(prompt, deps)
756
+ return StreamedAgentResult(gen)
757
+
758
    def _execute_stream(self, prompt: str, deps: Any) -> Generator[StreamEvent, None, AgentResult]:
        """Generator that executes the agent loop and yields stream events.

        Mirrors :meth:`_execute`, but emits ``text_delta`` events as the
        response arrives (one event per chunk, or a single event when tools
        force the non-streaming path), then a final ``output`` event
        carrying the :class:`AgentResult`, which is also the generator's
        return value.
        """
        self._state = AgentState.running
        self._stop_requested = False
        steps: list[AgentStep] = []

        try:
            # 1. Create per-run UsageSession and wire into DriverCallbacks
            session = UsageSession()
            driver_callbacks = DriverCallbacks(
                on_response=session.record,
                on_error=session.record_error,
            )

            # 2. Build initial RunContext
            ctx = self._build_run_context(prompt, deps, session, [], 0)

            # 3. Run input guardrails
            effective_prompt = self._run_input_guardrails(ctx, prompt)

            # 4. Resolve system prompt
            resolved_system_prompt = self._resolve_system_prompt(ctx)

            # 5. Wrap tools with context
            wrapped_tools = self._wrap_tools_with_context(ctx)
            has_tools = bool(wrapped_tools)

            # 6. Build Conversation
            conv = self._build_conversation(
                system_prompt=resolved_system_prompt,
                tools=wrapped_tools if wrapped_tools else None,
                driver_callbacks=driver_callbacks,
            )

            # 7. Fire on_iteration callback
            if self._agent_callbacks.on_iteration:
                self._agent_callbacks.on_iteration(0)

            if has_tools:
                # Tools registered: fall back to non-streaming conv.ask()
                response_text = conv.ask(effective_prompt)

                # Yield the full text as a single delta
                yield StreamEvent(
                    event_type=StreamEventType.text_delta,
                    data=response_text,
                )
            else:
                # No tools: use streaming if available
                response_text = ""
                stream_iter: Iterator[str] = conv.ask_stream(effective_prompt)
                for chunk in stream_iter:
                    response_text += chunk
                    yield StreamEvent(
                        event_type=StreamEventType.text_delta,
                        data=chunk,
                    )

            # 8. Extract steps
            all_tool_calls: list[dict[str, Any]] = []
            self._extract_steps(conv.messages, steps, all_tool_calls)

            # 9. Parse output (elapsed time is not tracked on this path: 0.0)
            if self._output_type is not None:
                output, output_text = self._parse_output(conv, response_text, steps, all_tool_calls, 0.0, session)
            else:
                output = response_text
                output_text = response_text

            # 10. Build result
            result = AgentResult(
                output=output,
                output_text=output_text,
                messages=conv.messages,
                usage=conv.usage,
                steps=steps,
                all_tool_calls=all_tool_calls,
                state=AgentState.idle,
                run_usage=session.summary(),
            )

            # 11. Run output guardrails (may re-prompt and replace the result)
            if self._output_guardrails:
                result = self._run_output_guardrails(ctx, result, conv, session, steps, all_tool_calls)

            # 12. Fire callbacks
            if self._agent_callbacks.on_step:
                for step in steps:
                    self._agent_callbacks.on_step(step)
            if self._agent_callbacks.on_output:
                self._agent_callbacks.on_output(result)

            # 13. Yield final output event
            yield StreamEvent(
                event_type=StreamEventType.output,
                data=result,
            )

            self._state = AgentState.idle
            return result
        except Exception:
            self._state = AgentState.errored
            raise
861
+
862
+
863
+ # ------------------------------------------------------------------
864
+ # AgentIterator
865
+ # ------------------------------------------------------------------
866
+
867
+
868
class AgentIterator:
    """Iterator over :meth:`Agent.iter` steps that records the final result.

    Exhausting the iterator (e.g. by a ``for`` loop) stores the wrapped
    generator's return value, exposed afterwards through :attr:`result`.
    """

    def __init__(self, gen: Generator[AgentStep, None, AgentResult]) -> None:
        self._gen = gen
        self._result: AgentResult | None = None

    def __iter__(self) -> AgentIterator:
        return self

    def __next__(self) -> AgentStep:
        try:
            step = next(self._gen)
        except StopIteration as stop:
            # A generator's return value rides on StopIteration.value.
            self._result = stop.value
            raise
        return step

    @property
    def result(self) -> AgentResult | None:
        """Final :class:`AgentResult`; ``None`` until iteration finishes."""
        return self._result
893
+
894
+
895
+ # ------------------------------------------------------------------
896
+ # StreamedAgentResult
897
+ # ------------------------------------------------------------------
898
+
899
+
900
class StreamedAgentResult:
    """Iterator over :meth:`Agent.run_stream` events that records the result.

    Yields :class:`StreamEvent` objects while iterating; exhausting the
    iterator stores the wrapped generator's return value, exposed
    afterwards through :attr:`result`.
    """

    def __init__(self, gen: Generator[StreamEvent, None, AgentResult]) -> None:
        self._gen = gen
        self._result: AgentResult | None = None

    def __iter__(self) -> StreamedAgentResult:
        return self

    def __next__(self) -> StreamEvent:
        try:
            event = next(self._gen)
        except StopIteration as stop:
            # A generator's return value rides on StopIteration.value.
            self._result = stop.value
            raise
        return event

    @property
    def result(self) -> AgentResult | None:
        """Final :class:`AgentResult`; ``None`` until iteration finishes."""
        return self._result