flock-core 0.5.6__py3-none-any.whl → 0.5.8__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release: this version of flock-core might be problematic.

flock/agent.py CHANGED
@@ -4,7 +4,7 @@ from __future__ import annotations
 
 import asyncio
 import os
-from collections.abc import Sequence
+from collections.abc import Callable, Sequence
 from dataclasses import dataclass
 from typing import TYPE_CHECKING, Any, TypedDict
 
@@ -64,6 +64,21 @@ class MCPServerConfig(TypedDict, total=False):
 class AgentOutput:
     spec: ArtifactSpec
     default_visibility: Visibility
+    count: int = 1  # Number of artifacts to generate (fan-out)
+    filter_predicate: Callable[[BaseModel], bool] | None = None  # Where clause
+    validate_predicate: Callable[[BaseModel], bool] | list[tuple[Callable, str]] | None = (
+        None  # Validation logic
+    )
+    group_description: str | None = None  # Group description override
+
+    def __post_init__(self):
+        """Validate field constraints."""
+        if self.count < 1:
+            raise ValueError(f"count must be >= 1, got {self.count}")
+
+    def is_many(self) -> bool:
+        """Return True if this output generates multiple artifacts (count > 1)."""
+        return self.count > 1
 
     def apply(
         self,
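
The three new fields above turn each declared output into a small contract: `count` drives fan-out, `filter_predicate` is the WHERE clause, and `validate_predicate` carries validation checks. A standalone sketch of the `count` guard and `is_many()` behaviour (it mirrors the dataclass logic in this hunk; it is not flock code):

    from dataclasses import dataclass


    @dataclass
    class FanOutDecl:
        """Minimal stand-in mirroring AgentOutput's count handling."""

        count: int = 1

        def __post_init__(self) -> None:
            if self.count < 1:
                raise ValueError(f"count must be >= 1, got {self.count}")

        def is_many(self) -> bool:
            return self.count > 1


    assert FanOutDecl().is_many() is False
    assert FanOutDecl(count=3).is_many() is True
    try:
        FanOutDecl(count=0)
    except ValueError as exc:
        print(exc)  # count must be >= 1, got 0

Because the guard runs in `__post_init__`, an invalid fan-out count fails at declaration time rather than when the engine runs.
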
@@ -85,6 +100,27 @@ class AgentOutput:
         )
 
 
+@dataclass
+class OutputGroup:
+    """Represents one .publishes() call.
+
+    Each OutputGroup triggers one engine execution that generates
+    all artifacts in the group together.
+    """
+
+    outputs: list[AgentOutput]
+    shared_visibility: Visibility | None = None
+    group_description: str | None = None  # Group-level description override
+
+    def is_single_call(self) -> bool:
+        """True if this is one engine call generating multiple artifacts.
+
+        Currently always returns True as each group = one engine call.
+        Future: Could return False for parallel sub-groups.
+        """
+        return True
+
+
 class Agent(metaclass=AutoTracedMeta):
     """Executable agent constructed via `AgentBuilder`.
 
@@ -96,7 +132,7 @@ class Agent(metaclass=AutoTracedMeta):
         self.description: str | None = None
         self._orchestrator = orchestrator
         self.subscriptions: list[Subscription] = []
-        self.outputs: list[AgentOutput] = []
+        self.output_groups: list[OutputGroup] = []
         self.utilities: list[AgentComponent] = []
         self.engines: list[EngineComponent] = []
         self.best_of_n: int = 1
@@ -115,6 +151,11 @@ class Agent(metaclass=AutoTracedMeta):
         self.mcp_server_mounts: dict[str, list[str]] = {}  # Server-specific mount points
         self.tool_whitelist: list[str] | None = None
 
+    @property
+    def outputs(self) -> list[AgentOutput]:
+        """Backwards compatibility: return flat list of all outputs from all groups."""
+        return [output for group in self.output_groups for output in group.outputs]
+
     @property
     def identity(self) -> AgentIdentity:
         return AgentIdentity(name=self.name, labels=self.labels, tenant_id=self.tenant_id)
@@ -160,9 +201,40 @@ class Agent(metaclass=AutoTracedMeta):
         processed_inputs = await self._run_pre_consume(ctx, artifacts)
         eval_inputs = EvalInputs(artifacts=processed_inputs, state=dict(ctx.state))
         eval_inputs = await self._run_pre_evaluate(ctx, eval_inputs)
-        result = await self._run_engines(ctx, eval_inputs)
-        result = await self._run_post_evaluate(ctx, eval_inputs, result)
-        outputs = await self._make_outputs(ctx, result)
+
+        # Phase 3: Call engine ONCE PER OutputGroup
+        all_outputs: list[Artifact] = []
+
+        if not self.output_groups:
+            # No output groups: Utility agents that don't publish
+            # Create empty OutputGroup for engines that may have side effects
+            empty_group = OutputGroup(outputs=[], group_description=None)
+            result = await self._run_engines(ctx, eval_inputs, empty_group)
+            # Run post_evaluate hooks for utility components (e.g., metrics)
+            result = await self._run_post_evaluate(ctx, eval_inputs, result)
+            # Utility agents return empty list (no outputs declared)
+            outputs = []
+        else:
+            # Loop over each output group
+            for group_idx, output_group in enumerate(self.output_groups):
+                # Prepare group-specific context
+                group_ctx = self._prepare_group_context(ctx, group_idx, output_group)
+
+                # Phase 7: Single evaluation path with auto-detection
+                # Engine's evaluate() auto-detects batch/fan-out from ctx and output_group
+                result = await self._run_engines(group_ctx, eval_inputs, output_group)
+
+                result = await self._run_post_evaluate(group_ctx, eval_inputs, result)
+
+                # Extract outputs for THIS group only
+                group_outputs = await self._make_outputs_for_group(
+                    group_ctx, result, output_group
+                )
+
+                all_outputs.extend(group_outputs)
+
+            outputs = all_outputs
+
         await self._run_post_publish(ctx, outputs)
         if self.calls_func:
             await self._invoke_call(ctx, outputs or processed_inputs)
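
This loop is the behavioural core of the release: each `.publishes()` call on the builder becomes one `OutputGroup`, and `execute` now runs the engine once per group (agents with no declared outputs still get a single engine call with an empty group). A hedged sketch of what that implies for a caller, assuming `builder` is an `AgentBuilder` obtained elsewhere in your application (how the builder and agent are constructed is not part of this diff), and `Report`/`Task` are placeholder Pydantic models:

    from pydantic import BaseModel


    class Report(BaseModel):
        title: str


    class Task(BaseModel):
        priority: int


    builder.publishes(Report)           # group 0: one Report per execution
    builder.publishes(Task, fan_out=3)  # group 1: three Tasks from a single engine call

    # Two .publishes() calls -> two OutputGroups -> evaluate() runs twice per execution.
    # (_agent is internal; it is inspected here only to show the resulting shape.)
    agent = builder._agent
    assert len(agent.output_groups) == 2
    assert agent.output_groups[1].outputs[0].count == 3
    assert len(agent.outputs) == 2  # backwards-compatible flat view across all groups
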
@@ -302,7 +374,19 @@ class Agent(metaclass=AutoTracedMeta):
                 raise
         return current
 
-    async def _run_engines(self, ctx: Context, inputs: EvalInputs) -> EvalResult:
+    async def _run_engines(
+        self, ctx: Context, inputs: EvalInputs, output_group: OutputGroup
+    ) -> EvalResult:
+        """Execute engines for a specific OutputGroup.
+
+        Args:
+            ctx: Execution context
+            inputs: EvalInputs with input artifacts
+            output_group: The OutputGroup defining what artifacts to produce
+
+        Returns:
+            EvalResult with artifacts matching output_group specifications
+        """
         engines = self._resolve_engines()
         if not engines:
             return EvalResult(artifacts=inputs.artifacts, state=inputs.state)
@@ -313,26 +397,10 @@ class Agent(metaclass=AutoTracedMeta):
         accumulated_metrics: dict[str, float] = {}
         for engine in engines:
             current_inputs = await engine.on_pre_evaluate(self, ctx, current_inputs)
-            use_batch_mode = bool(getattr(ctx, "is_batch", False))
-            try:
-                if use_batch_mode:
-                    logger.debug(
-                        "Agent %s: routing %d artifacts to %s.evaluate_batch",
-                        self.name,
-                        len(current_inputs.artifacts),
-                        engine.__class__.__name__,
-                    )
-                    result = await engine.evaluate_batch(self, ctx, current_inputs)
-                else:
-                    result = await engine.evaluate(self, ctx, current_inputs)
-            except NotImplementedError:
-                if use_batch_mode:
-                    logger.exception(
-                        "Agent %s: engine %s does not implement evaluate_batch()",
-                        self.name,
-                        engine.__class__.__name__,
-                    )
-                raise
+
+            # Phase 7: Single evaluation path with auto-detection
+            # Engine's evaluate() auto-detects batching via ctx.is_batch
+            result = await engine.evaluate(self, ctx, current_inputs, output_group)
 
             # AUTO-WRAP: If engine returns BaseModel instead of EvalResult, wrap it
             from flock.runtime import EvalResult as ER
@@ -392,29 +460,177 @@ class Agent(metaclass=AutoTracedMeta):
         return current
 
     async def _make_outputs(self, ctx: Context, result: EvalResult) -> list[Artifact]:
-        if not self.outputs:
+        if not self.output_groups:
             # Utility agents may not publish anything
             return list(result.artifacts)
 
         produced: list[Artifact] = []
-        for output_decl in self.outputs:
-            # Phase 6: Find the matching artifact from engine result to preserve its ID
-            matching_artifact = self._find_matching_artifact(output_decl, result)
-
-            payload = self._select_payload(output_decl, result)
-            if payload is None:
-                continue
-            metadata = {
-                "correlation_id": ctx.correlation_id,
-            }
-
-            # Phase 6: Preserve artifact ID from engine (for streaming message preview)
-            if matching_artifact:
-                metadata["artifact_id"] = matching_artifact.id
-
-            artifact = output_decl.apply(payload, produced_by=self.name, metadata=metadata)
-            produced.append(artifact)
-            await ctx.board.publish(artifact)
+
+        # For Phase 2: Iterate ALL output_groups (even though we only have 1 engine call)
+        # Phase 3 will modify this to call engine once PER group
+        for output_group in self.output_groups:
+            for output_decl in output_group.outputs:
+                # Phase 6: Find the matching artifact from engine result to preserve its ID
+                matching_artifact = self._find_matching_artifact(output_decl, result)
+
+                payload = self._select_payload(output_decl, result)
+                if payload is None:
+                    continue
+                metadata = {
+                    "correlation_id": ctx.correlation_id,
+                }
+
+                # Phase 6: Preserve artifact ID from engine (for streaming message preview)
+                if matching_artifact:
+                    metadata["artifact_id"] = matching_artifact.id
+
+                artifact = output_decl.apply(payload, produced_by=self.name, metadata=metadata)
+                produced.append(artifact)
+                await ctx.board.publish(artifact)
+
+        return produced
+
+    def _prepare_group_context(
+        self, ctx: Context, group_idx: int, output_group: OutputGroup
+    ) -> Context:
+        """Phase 3: Prepare context specific to this OutputGroup.
+
+        Creates a modified context for this group's engine call, potentially
+        with group-specific instructions or metadata.
+
+        Args:
+            ctx: Base context
+            group_idx: Index of this group (0-based)
+            output_group: The OutputGroup being processed
+
+        Returns:
+            Context for this group (may be the same instance or modified)
+        """
+        # For now, return the same context
+        # Phase 4 will add group-specific system prompts here
+        # Future: ctx.clone() and add group_description to system prompt
+        return ctx
+
+    async def _make_outputs_for_group(
+        self, ctx: Context, result: EvalResult, output_group: OutputGroup
+    ) -> list[Artifact]:
+        """Phase 3/5: Validate, filter, and publish artifacts for specific OutputGroup.
+
+        This function:
+        1. Validates that the engine fulfilled its contract (produced expected count)
+        2. Applies WHERE filtering (reduces artifacts, no error)
+        3. Applies VALIDATE checks (raises ValueError if validation fails)
+        4. Applies visibility (static or dynamic)
+        5. Publishes artifacts to the board
+
+        Args:
+            ctx: Context for this group
+            result: EvalResult from engine for THIS group
+            output_group: OutputGroup defining expected outputs
+
+        Returns:
+            List of artifacts matching this group's outputs
+
+        Raises:
+            ValueError: If engine violated contract or validation failed
+        """
+        produced: list[Artifact] = []
+
+        for output_decl in output_group.outputs:
+            # 1. Find ALL matching artifacts for this type
+            from flock.registry import type_registry
+
+            expected_canonical = type_registry.resolve_name(output_decl.spec.type_name)
+
+            matching_artifacts: list[Artifact] = []
+            for artifact in result.artifacts:
+                try:
+                    artifact_canonical = type_registry.resolve_name(artifact.type)
+                    if artifact_canonical == expected_canonical:
+                        matching_artifacts.append(artifact)
+                except Exception:
+                    if artifact.type == output_decl.spec.type_name:
+                        matching_artifacts.append(artifact)
+
+            # 2. STRICT VALIDATION: Engine must produce exactly what was promised
+            # (This happens BEFORE filtering so engine contract is validated first)
+            expected_count = output_decl.count
+            actual_count = len(matching_artifacts)
+
+            if actual_count != expected_count:
+                raise ValueError(
+                    f"Engine contract violation in agent '{self.name}': "
+                    f"Expected {expected_count} artifact(s) of type '{output_decl.spec.type_name}', "
+                    f"but engine produced {actual_count}. "
+                    f"Check your engine implementation to ensure it generates the correct number of outputs."
+                )
+
+            # 3. Apply WHERE filtering (Phase 5)
+            # Filtering reduces the number of published artifacts (this is intentional)
+            # NOTE: Predicates expect Pydantic model instances, not dicts
+            model_cls = type_registry.resolve(output_decl.spec.type_name)
+
+            if output_decl.filter_predicate:
+                original_count = len(matching_artifacts)
+                filtered = []
+                for a in matching_artifacts:
+                    # Reconstruct Pydantic model from payload dict
+                    model_instance = model_cls(**a.payload)
+                    if output_decl.filter_predicate(model_instance):
+                        filtered.append(a)
+                matching_artifacts = filtered
+                logger.debug(
+                    f"Agent {self.name}: WHERE filter reduced artifacts from "
+                    f"{original_count} to {len(matching_artifacts)} for type {output_decl.spec.type_name}"
+                )
+
+            # 4. Apply VALIDATE checks (Phase 5)
+            # Validation failures raise errors (fail-fast)
+            if output_decl.validate_predicate:
+                if callable(output_decl.validate_predicate):
+                    # Single predicate
+                    for artifact in matching_artifacts:
+                        # Reconstruct Pydantic model from payload dict
+                        model_instance = model_cls(**artifact.payload)
+                        if not output_decl.validate_predicate(model_instance):
+                            raise ValueError(
+                                f"Validation failed for {output_decl.spec.type_name} "
+                                f"in agent '{self.name}'"
+                            )
+                elif isinstance(output_decl.validate_predicate, list):
+                    # List of (callable, error_msg) tuples
+                    for artifact in matching_artifacts:
+                        # Reconstruct Pydantic model from payload dict
+                        model_instance = model_cls(**artifact.payload)
+                        for check, error_msg in output_decl.validate_predicate:
+                            if not check(model_instance):
+                                raise ValueError(f"{error_msg}: {output_decl.spec.type_name}")
+
+            # 5. Apply visibility and publish artifacts (Phase 5)
+            for artifact_from_engine in matching_artifacts:
+                metadata = {
+                    "correlation_id": ctx.correlation_id,
+                    "artifact_id": artifact_from_engine.id,  # Preserve engine's ID
+                }
+
+                # Determine visibility (static or dynamic)
+                visibility = output_decl.default_visibility
+                if callable(visibility):
+                    # Dynamic visibility based on artifact content
+                    # Reconstruct Pydantic model from payload dict
+                    model_instance = model_cls(**artifact_from_engine.payload)
+                    visibility = visibility(model_instance)
+
+                # Override metadata visibility
+                metadata["visibility"] = visibility
+
+                # Re-wrap the artifact with agent metadata
+                artifact = output_decl.apply(
+                    artifact_from_engine.payload, produced_by=self.name, metadata=metadata
+                )
+                produced.append(artifact)
+                await ctx.board.publish(artifact)
+
         return produced
 
     async def _run_post_publish(self, ctx: Context, artifacts: Sequence[Artifact]) -> None:
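
The ordering in `_make_outputs_for_group` matters: the count contract is checked against the raw engine result, then `where` silently narrows what gets published, and only then do `validate` checks run (and raise). A standalone sketch of those three steps over plain Pydantic payloads (it mirrors the logic above rather than calling flock, so the moving parts are easy to see):

    from pydantic import BaseModel


    class Task(BaseModel):
        priority: int
        title: str


    def where(t: Task) -> bool:  # filter_predicate: drops non-matches, no error
        return t.priority > 5


    validate = [  # validate_predicate: list of (check, error_msg) tuples, fail-fast
        (lambda t: bool(t.title), "title must not be empty"),
    ]

    payloads = [
        {"priority": 7, "title": "ship it"},
        {"priority": 2, "title": "later"},
        {"priority": 9, "title": "urgent"},
    ]

    expected_count = 3  # AgentOutput.count, e.g. declared via fan_out=3
    if len(payloads) != expected_count:
        raise ValueError("Engine contract violation: wrong number of artifacts")

    kept = [p for p in payloads if where(Task(**p))]  # WHERE runs on rebuilt model instances
    for p in kept:
        instance = Task(**p)
        for check, error_msg in validate:
            if not check(instance):
                raise ValueError(f"{error_msg}: Task")

    print(len(kept))  # 2 -> only the two high-priority tasks would reach the board
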
@@ -453,9 +669,16 @@ class Agent(metaclass=AutoTracedMeta):
         for component in self._sorted_utilities():
             comp_name = self._component_display_name(component)
             priority = getattr(component, "priority", 0)
+
+            # Python 3.12+ TaskGroup raises BaseExceptionGroup - extract sub-exceptions
+            error_detail = str(error)
+            if isinstance(error, BaseExceptionGroup):
+                sub_exceptions = [f"{type(e).__name__}: {e}" for e in error.exceptions]
+                error_detail = f"{error!s} - Sub-exceptions: {sub_exceptions}"
+
             logger.debug(
                 f"Agent error hook: agent={self.name}, component={comp_name}, "
-                f"priority={priority}, error={error!s}"
+                f"priority={priority}, error={error_detail}"
             )
             try:
                 await component.on_error(self, ctx, error)
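
The new branch exists because a failure inside an `asyncio.TaskGroup` surfaces as a `BaseExceptionGroup` (available since Python 3.11), whose `str()` hides the individual causes; unpacking `.exceptions` keeps the debug log useful. A minimal standalone illustration of the same unpacking:

    import asyncio


    async def boom(msg: str) -> None:
        raise RuntimeError(msg)


    async def main() -> None:
        try:
            async with asyncio.TaskGroup() as tg:
                tg.create_task(boom("first failure"))
                tg.create_task(boom("second failure"))
        except BaseExceptionGroup as error:
            # Same pattern as the hook above: summarise each sub-exception for the log line.
            sub_exceptions = [f"{type(e).__name__}: {e}" for e in error.exceptions]
            print(f"{error!s} - Sub-exceptions: {sub_exceptions}")


    asyncio.run(main())
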
@@ -699,43 +922,34 @@ class AgentBuilder:
         return self
 
     def publishes(
-        self, *types: type[BaseModel], visibility: Visibility | None = None
+        self,
+        *types: type[BaseModel],
+        visibility: Visibility | Callable[[BaseModel], Visibility] | None = None,
+        fan_out: int | None = None,
+        where: Callable[[BaseModel], bool] | None = None,
+        validate: Callable[[BaseModel], bool] | list[tuple[Callable, str]] | None = None,
+        description: str | None = None,
     ) -> PublishBuilder:
         """Declare which artifact types this agent produces.
 
-        Configures the output types and default visibility controls for artifacts
-        published by this agent. Can chain with .where() for conditional publishing.
-
         Args:
             *types: Artifact types (Pydantic models) to publish
-            visibility: Default visibility control for all outputs. Defaults to PublicVisibility.
-                Can be overridden per-publish or with .where() chaining.
+            visibility: Default visibility control OR callable for dynamic visibility
+            fan_out: Number of artifacts to publish (applies to ALL types)
+            where: Filter predicate for output artifacts
+            validate: Validation predicate(s) - callable or list of (callable, error_msg) tuples
+            description: Group-level description override
 
         Returns:
            PublishBuilder for conditional publishing configuration
 
         Examples:
-            >>> # Basic output declaration
-            >>> agent.publishes(Report)
-
-            >>> # Multiple output types
-            >>> agent.publishes(Summary, DetailedReport, Alert)
-
-            >>> # Private outputs (only specific agents can see)
-            >>> agent.publishes(
-            ...     SecretData,
-            ...     visibility=PrivateVisibility(agents={"admin", "auditor"})
-            ... )
-
-            >>> # Tenant-isolated outputs
-            >>> agent.publishes(
-            ...     Invoice,
-            ...     visibility=TenantVisibility()
-            ... )
-
-            >>> # Conditional publishing with chaining
-            >>> (agent.publishes(Alert)
-            ...     .where(lambda result: result.severity == "critical"))
+            >>> agent.publishes(Report)  # Publish 1 Report
+            >>> agent.publishes(Task, Task, Task)  # Publish 3 Tasks (duplicate counting)
+            >>> agent.publishes(Task, fan_out=3)  # Same as above (sugar syntax)
+            >>> agent.publishes(Task, where=lambda t: t.priority > 5)  # With filtering
+            >>> agent.publishes(Report, validate=lambda r: r.score > 0)  # With validation
+            >>> agent.publishes(Task, description="Special instructions")  # With description
 
         See Also:
             - PublicVisibility: Default, visible to all agents
@@ -743,14 +957,59 @@ class AgentBuilder:
             - TenantVisibility: Multi-tenant isolation
             - LabelledVisibility: Role-based access control
         """
-        outputs = []
-        for model in types:
-            spec = ArtifactSpec.from_model(model)
-            output = AgentOutput(spec=spec, default_visibility=ensure_visibility(visibility))
-            self._agent.outputs.append(output)
-            outputs.append(output)
-        # T074: Validate configuration after adding outputs
+        # Validate fan_out if provided
+        if fan_out is not None and fan_out < 1:
+            raise ValueError(f"fan_out must be >= 1, got {fan_out}")
+
+        # Resolve visibility
+        resolved_visibility = (
+            ensure_visibility(visibility) if not callable(visibility) else visibility
+        )
+
+        # Create AgentOutput objects for this group
+        outputs: list[AgentOutput] = []
+
+        if fan_out is not None:
+            # Apply fan_out to ALL types
+            for model in types:
+                spec = ArtifactSpec.from_model(model)
+                output = AgentOutput(
+                    spec=spec,
+                    default_visibility=resolved_visibility,
+                    count=fan_out,
+                    filter_predicate=where,
+                    validate_predicate=validate,
+                    group_description=description,
+                )
+                outputs.append(output)
+        else:
+            # Create separate AgentOutput for each type (including duplicates)
+            # This preserves order: .publishes(A, B, A) → [A, B, A] (3 outputs)
+            for model in types:
+                spec = ArtifactSpec.from_model(model)
+                output = AgentOutput(
+                    spec=spec,
+                    default_visibility=resolved_visibility,
+                    count=1,
+                    filter_predicate=where,
+                    validate_predicate=validate,
+                    group_description=description,
+                )
+                outputs.append(output)
+
+        # Create OutputGroup from outputs
+        group = OutputGroup(
+            outputs=outputs,
+            shared_visibility=resolved_visibility if not callable(resolved_visibility) else None,
+            group_description=description,
+        )
+
+        # Append to agent's output_groups
+        self._agent.output_groups.append(group)
+
+        # Validate configuration
         self._validate_self_trigger_risk()
+
         return PublishBuilder(self, outputs)
 
     def with_utilities(self, *components: AgentComponent) -> AgentBuilder:
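
Putting the new keywords together, one call can now declare fan-out, filtering, validation, a group description, and per-artifact visibility. A hedged usage sketch, assuming `builder` is an `AgentBuilder` and that `PrivateVisibility`/`PublicVisibility` (referenced in the docstring's See Also section) can be constructed as shown; their import paths are not visible in this diff:

    from pydantic import BaseModel


    class Task(BaseModel):
        priority: int
        sensitive: bool


    # fan_out=3: the engine must return exactly three Tasks (strict contract),
    # where=... then silently drops low-priority ones before publishing,
    # validate=... raises ValueError if any surviving Task fails a check.
    builder.publishes(
        Task,
        fan_out=3,
        where=lambda t: t.priority >= 5,
        validate=[(lambda t: t.priority <= 10, "priority out of range")],
        description="Break the request into follow-up tasks",
    )


    def task_visibility(t: Task):
        # Dynamic visibility: resolved per artifact from its content.
        return PrivateVisibility(agents={"auditor"}) if t.sensitive else PublicVisibility()


    builder.publishes(Task, visibility=task_visibility)
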
@@ -1081,7 +1340,9 @@ class AgentBuilder:
             consuming_types.update(sub.type_names)
 
         # Get types agent publishes
-        publishing_types = {output.spec.type_name for output in self._agent.outputs}
+        publishing_types = {
+            output.spec.type_name for group in self._agent.output_groups for output in group.outputs
+        }
 
         # Check for overlap
         overlap = consuming_types.intersection(publishing_types)
@@ -1225,4 +1486,6 @@ class Pipeline:
 __all__ = [
     "Agent",
     "AgentBuilder",
+    "AgentOutput",
+    "OutputGroup",
 ]
flock/artifacts.py CHANGED
@@ -2,7 +2,7 @@
 
 from __future__ import annotations
 
-from datetime import datetime, timezone
+from datetime import UTC, datetime
 from typing import Any
 from uuid import UUID, uuid4
 
@@ -23,7 +23,7 @@ class Artifact(BaseModel):
     partition_key: str | None = None
     tags: set[str] = Field(default_factory=set)
     visibility: Visibility = Field(default_factory=lambda: ensure_visibility(None))
-    created_at: datetime = Field(default_factory=lambda: datetime.now(timezone.utc))
+    created_at: datetime = Field(default_factory=lambda: datetime.now(UTC))
     version: int = 1
 
     def model_dump_payload(self) -> dict[str, Any]:  # pragma: no cover - convenience
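
`UTC` is the alias for `timezone.utc` that was added to the `datetime` module in Python 3.11, so the two changes in this file are behaviour-preserving but do assume a 3.11+ interpreter. A quick check:

    from datetime import UTC, datetime, timezone

    assert UTC is timezone.utc
    print(datetime.now(UTC).isoformat())  # e.g. 2025-01-01T12:00:00.000000+00:00
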
flock/components.py CHANGED
@@ -2,11 +2,11 @@
 
 from __future__ import annotations
 
-from typing import TYPE_CHECKING, Any
+from typing import TYPE_CHECKING, Any, Self
 
 from pydantic import BaseModel, Field, create_model
 from pydantic._internal._model_construction import ModelMetaclass
-from typing_extensions import Self, TypeVar
+from typing_extensions import TypeVar
 
 from flock.logging.auto_trace import AutoTracedMeta
 
@@ -14,7 +14,7 @@ from flock.logging.auto_trace import AutoTracedMeta
 if TYPE_CHECKING:  # pragma: no cover - type checking only
     from uuid import UUID
 
-    from flock.agent import Agent
+    from flock.agent import Agent, OutputGroup
     from flock.artifacts import Artifact
     from flock.runtime import Context, EvalInputs, EvalResult
 
@@ -109,41 +109,49 @@ class EngineComponent(AgentComponent):
         default_factory=set, description="Artifact types to exclude from context"
     )
 
-    async def evaluate(self, agent: Agent, ctx: Context, inputs: EvalInputs) -> EvalResult:
-        """Override this method in your engine implementation."""
-        raise NotImplementedError
+    async def evaluate(
+        self, agent: Agent, ctx: Context, inputs: EvalInputs, output_group: OutputGroup
+    ) -> EvalResult:
+        """Universal evaluation method with auto-detection of batch and fan-out modes.
 
-    async def evaluate_batch(self, agent: Agent, ctx: Context, inputs: EvalInputs) -> EvalResult:
-        """Process batch of accumulated artifacts (BatchSpec).
+        This single method handles ALL evaluation scenarios:
+        - Single artifact single output
+        - Batch processing (ctx.is_batch=True) → list[Type] signatures
+        - Fan-out (output_group.outputs[*].count > 1) → multiple artifacts
+        - Multi-output (len(output_group.outputs) > 1) → multiple types
 
-        Override this method if your engine supports batch processing.
+        Auto-detection happens automatically:
+        - Batching: Detected via ctx.is_batch flag
+        - Fan-out: Detected via output_group.outputs[*].count
+        - Multi-input: Detected via len(inputs.artifacts)
+        - Multi-output: Detected via len(output_group.outputs)
 
         Args:
             agent: Agent instance executing this engine
-            ctx: Execution context (ctx.is_batch will be True)
-            inputs: EvalInputs with inputs.artifacts containing batch items
+            ctx: Execution context (check ctx.is_batch for batch mode)
+            inputs: EvalInputs with input artifacts
+            output_group: OutputGroup defining what artifacts to produce
+                (inspect outputs[*].count for fan-out detection)
 
         Returns:
-            EvalResult with processed artifacts
-
-        Raises:
-            NotImplementedError: If engine doesn't support batching
-
-        Example:
-            >>> async def evaluate_batch(self, agent, ctx, inputs):
-            ...     events = inputs.all_as(Event)  # Get ALL items
-            ...     results = await bulk_process(events)
-            ...     return EvalResult.from_objects(*results, agent=agent)
+            EvalResult with artifacts matching output_group specifications
+
+        Implementation Guide:
+            >>> async def evaluate(self, agent, ctx, inputs, output_group):
+            ...     # Auto-detect batching from context
+            ...     batched = bool(getattr(ctx, "is_batch", False))
+            ...
+            ...     # Fan-out is auto-detected from output_group
+            ...     # Your signature building should check:
+            ...     #   - output_group.outputs[i].count > 1 for fan-out
+            ...     #   - len(output_group.outputs) > 1 for multi-output
+            ...
+            ...     # Build signature adapting to all modes
+            ...     signature = self._build_signature(inputs, output_group, batched)
+            ...     result = await self._execute(signature, inputs)
+            ...     return EvalResult.from_objects(*result, agent=agent)
         """
-        raise NotImplementedError(
-            f"{self.__class__.__name__} does not support batch processing.\n\n"
-            f"To fix this:\n"
-            f"1. Remove BatchSpec from agent subscription, OR\n"
-            f"2. Implement evaluate_batch() in {self.__class__.__name__}, OR\n"
-            f"3. Use a batch-aware engine (e.g., CustomBatchEngine)\n\n"
-            f"Agent: {agent.name}\n"
-            f"Engine: {self.__class__.__name__}"
-        )
+        raise NotImplementedError
 
     async def fetch_conversation_context(
         self,
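
For engine authors, the practical consequence of this hunk is that `evaluate_batch()` is gone and `evaluate()` now takes an `output_group` and is expected to honour each declared `count`. A hedged sketch of a custom engine under the new contract, following the Implementation Guide above; the import paths, `EvalResult.from_objects(...)`, and `ctx.is_batch` are taken from this diff, while the `Idea` model and the generation logic are purely illustrative:

    from pydantic import BaseModel

    from flock.components import EngineComponent
    from flock.runtime import EvalResult


    class Idea(BaseModel):
        text: str


    class IdeaEngine(EngineComponent):
        """Toy engine for an agent declared with .publishes(Idea, ...), e.g. fan_out=N."""

        async def evaluate(self, agent, ctx, inputs, output_group):
            # Batch mode is now a flag on the context, not a separate method.
            batched = bool(getattr(ctx, "is_batch", False))
            n_inputs = len(inputs.artifacts) if batched else min(len(inputs.artifacts), 1)

            ideas: list[Idea] = []
            for output in output_group.outputs:
                # The strict contract in _make_outputs_for_group expects exactly
                # `output.count` artifacts per declared type, so honour it here.
                ideas.extend(
                    Idea(text=f"idea {i + 1} (from {n_inputs} input artifact(s))")
                    for i in range(output.count)
                )

            return EvalResult.from_objects(*ideas, agent=agent)
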