PyPI - flock-core - Versions diffs - 0.5.2__py3-none-any.whl → 0.5.3__py3-none-any.whl - Mend

flock-core 0.5.2py3-none-any.whl → 0.5.3py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of flock-core might be problematic. Click here for more details.

Files changed (11) hide show

flock/agent.py +16 -3
flock/artifact_collector.py +159 -0
flock/batch_accumulator.py +252 -0
flock/correlation_engine.py +218 -0
flock/orchestrator.py +137 -3
flock/subscription.py +70 -7
{flock_core-0.5.2.dist-info → flock_core-0.5.3.dist-info}/METADATA +62 -14
{flock_core-0.5.2.dist-info → flock_core-0.5.3.dist-info}/RECORD +11 -8
{flock_core-0.5.2.dist-info → flock_core-0.5.3.dist-info}/WHEEL +0 -0
{flock_core-0.5.2.dist-info → flock_core-0.5.3.dist-info}/entry_points.txt +0 -0
{flock_core-0.5.2.dist-info → flock_core-0.5.3.dist-info}/licenses/LICENSE +0 -0

flock/agent.py CHANGED Viewed

@@ -988,10 +988,23 @@ class AgentBuilder:
     def _normalize_join(self, value: dict | JoinSpec | None) -> JoinSpec | None:
         if value is None or isinstance(value, JoinSpec):
             return value
+        # Phase 2: New JoinSpec API with 'by' and 'within' (time OR count)
+        from datetime import timedelta
+        within_value = value.get("within")
+        if isinstance(within_value, (int, float)):
+            # Count window or seconds as float - keep as is
+            within = (
+                int(within_value)
+                if isinstance(within_value, int)
+                else timedelta(seconds=within_value)
+            )
+        else:
+            # Default to 1 minute time window
+            within = timedelta(minutes=1)
         return JoinSpec(
-            kind=value.get("kind", "all_of"),
-            window=float(value.get("window", 0.0)),
-            by=value.get("by"),
+            by=value["by"],  # Required
+            within=within,
         )
     def _normalize_batch(self, value: dict | BatchSpec | None) -> BatchSpec | None:

flock/artifact_collector.py ADDED Viewed

@@ -0,0 +1,159 @@
+"""Artifact collection and waiting pool management for AND gate logic.
+This module implements the waiting pool mechanism that enables `.consumes(A, B)`
+to wait for BOTH types before triggering an agent (AND gate logic).
+Architecture:
+- Each subscription gets a unique waiting pool identified by (agent_name, subscription_index)
+- Artifacts are collected per type until all required types are present
+- When complete, all collected artifacts are returned for agent execution
+- After triggering, the waiting pool is cleared for the next cycle
+"""
+from __future__ import annotations
+from collections import defaultdict
+from typing import TYPE_CHECKING
+if TYPE_CHECKING:
+    from flock.agent import Agent
+    from flock.artifacts import Artifact
+    from flock.subscription import Subscription
+class ArtifactCollector:
+    """Manages waiting pools for multi-type subscriptions (AND gate logic).
+    Each subscription with multiple types gets a waiting pool that collects
+    artifacts until all required types are present. Single-type subscriptions
+    bypass the waiting pool for immediate triggering.
+    Example:
+        agent.consumes(TypeA, TypeB)  # Creates waiting pool for 2 types
+        # TypeA published → added to pool (not complete yet)
+        # TypeB published → added to pool (NOW complete!)
+        # → Agent triggered with [TypeA_artifact, TypeB_artifact]
+        # → Waiting pool cleared for next cycle
+    """
+    def __init__(self) -> None:
+        """Initialize empty waiting pools."""
+        # Structure: {(agent_name, subscription_index): {type_name: [artifact1, artifact2, ...]}}
+        # Example: {("diagnostician", 0): {"XRay": [artifact1], "LabResult": [artifact2]}}
+        # For count-based AND gates: {"TypeA": [artifact1, artifact2, artifact3]} (3 As collected)
+        self._waiting_pools: dict[tuple[str, int], dict[str, list[Artifact]]] = defaultdict(
+            lambda: defaultdict(list)
+        )
+    def add_artifact(
+        self,
+        agent: Agent,
+        subscription: Subscription,
+        artifact: Artifact,
+    ) -> tuple[bool, list[Artifact]]:
+        """Add artifact to waiting pool and check for completeness.
+        Args:
+            agent: Agent that will process the artifacts
+            subscription: Subscription that matched the artifact
+            artifact: Artifact to add to the waiting pool
+        Returns:
+            Tuple of (is_complete, artifacts):
+                - is_complete: True if all required types are now present
+                - artifacts: List of collected artifacts (empty if incomplete, all artifacts if complete)
+        Design Notes:
+            - Single-type subscriptions with count=1 bypass the pool and return immediately complete
+            - Multi-type or count-based subscriptions collect artifacts until all required counts met
+            - Latest artifacts win (keeps most recent N artifacts per type)
+            - After returning complete=True, the pool is automatically cleared
+        """
+        # Single-type subscription with count=1: No waiting needed (immediate trigger)
+        if len(subscription.type_names) == 1 and subscription.type_counts[artifact.type] == 1:
+            return (True, [artifact])
+        # Multi-type or count-based subscription: Use waiting pool (AND gate logic)
+        # Find subscription index (agents can have multiple subscriptions)
+        try:
+            subscription_index = agent.subscriptions.index(subscription)
+        except ValueError:
+            # Should never happen, but defensive programming
+            raise RuntimeError(
+                f"Subscription not found in agent {agent.name}. "
+                "This indicates an internal orchestrator error."
+            )
+        pool_key = (agent.name, subscription_index)
+        # Add artifact to pool (collect in list for count-based logic)
+        self._waiting_pools[pool_key][artifact.type].append(artifact)
+        # Check if all required counts are met
+        is_complete = True
+        for type_name, required_count in subscription.type_counts.items():
+            collected_count = len(self._waiting_pools[pool_key][type_name])
+            if collected_count < required_count:
+                is_complete = False
+                break
+        if is_complete:
+            # Complete! Collect all artifacts (flatten lists) and clear the pool
+            artifacts = []
+            for type_name, required_count in subscription.type_counts.items():
+                # Take exactly the required count (latest artifacts)
+                type_artifacts = self._waiting_pools[pool_key][type_name]
+                artifacts.extend(type_artifacts[:required_count])
+            del self._waiting_pools[pool_key]  # Clear for next cycle
+            return (True, artifacts)
+        else:
+            # Incomplete - still waiting for more artifacts
+            return (False, [])
+    def get_waiting_status(
+        self, agent: Agent, subscription_index: int
+    ) -> dict[str, list[Artifact]]:
+        """Get current waiting pool contents for debugging/inspection.
+        Args:
+            agent: Agent to inspect
+            subscription_index: Index of the subscription
+        Returns:
+            Dictionary mapping type names to lists of collected artifacts (empty if none)
+        """
+        pool_key = (agent.name, subscription_index)
+        # Return a copy to prevent external mutation
+        pool = self._waiting_pools.get(pool_key, {})
+        return {type_name: list(artifacts) for type_name, artifacts in pool.items()}
+    def clear_waiting_pool(self, agent: Agent, subscription_index: int) -> None:
+        """Manually clear a waiting pool.
+        Useful for cleanup or resetting agent state.
+        Args:
+            agent: Agent whose pool to clear
+            subscription_index: Index of the subscription
+        """
+        pool_key = (agent.name, subscription_index)
+        if pool_key in self._waiting_pools:
+            del self._waiting_pools[pool_key]
+    def clear_all_pools(self) -> None:
+        """Clear all waiting pools.
+        Useful for orchestrator shutdown or test cleanup.
+        """
+        self._waiting_pools.clear()
+    def get_pool_count(self) -> int:
+        """Get total number of active waiting pools (for metrics/debugging)."""
+        return len(self._waiting_pools)
+__all__ = ["ArtifactCollector"]

flock/batch_accumulator.py ADDED Viewed

@@ -0,0 +1,252 @@
+"""
+BatchAccumulator: Manages batch collection with size/timeout triggers.
+Supports BatchSpec-based batching:
+- Accumulates artifacts in batches per subscription
+- Flushes on size threshold (e.g., batch of 25)
+- Flushes on timeout (e.g., every 30 seconds)
+- Whichever comes first wins
+- Ensures zero data loss on shutdown
+"""
+from __future__ import annotations
+from collections import defaultdict
+from datetime import datetime, timedelta
+from typing import TYPE_CHECKING
+if TYPE_CHECKING:
+    from flock.artifacts import Artifact
+    from flock.subscription import BatchSpec, Subscription
+class BatchAccumulator:
+    """
+    Tracks artifact batches waiting for size/timeout triggers.
+    Example: For orders, accumulate 25 at a time to batch process payments.
+    When 25th order arrives OR 30 seconds elapse, flush the batch.
+    """
+    def __init__(
+        self,
+        *,
+        batch_spec: BatchSpec,
+        created_at: datetime,
+    ):
+        self.batch_spec = batch_spec
+        self.created_at = created_at  # When first artifact arrived
+        self.artifacts: list[Artifact] = []
+    def add_artifact(self, artifact: Artifact) -> bool:
+        """
+        Add artifact to batch.
+        Returns:
+            True if batch should flush (size threshold reached), False otherwise
+        """
+        self.artifacts.append(artifact)
+        # Check size threshold
+        if self.batch_spec.size is not None:
+            if len(self.artifacts) >= self.batch_spec.size:
+                return True  # Flush now (size threshold reached)
+        return False  # Not ready to flush yet
+    def is_timeout_expired(self) -> bool:
+        """Check if timeout has expired since batch started."""
+        if self.batch_spec.timeout is None:
+            return False
+        elapsed = datetime.now() - self.created_at
+        return elapsed >= self.batch_spec.timeout
+    def get_artifacts(self) -> list[Artifact]:
+        """Get all artifacts in batch."""
+        return self.artifacts.copy()
+    def clear(self) -> None:
+        """Clear the batch after flush."""
+        self.artifacts.clear()
+class BatchEngine:
+    """
+    Manages batch state for BatchSpec subscriptions.
+    Responsibilities:
+    1. Accumulate artifacts per (agent, subscription_index)
+    2. Track batch size and timeout per batch
+    3. Return complete batches when size or timeout threshold met
+    4. Provide shutdown flush for partial batches
+    Example usage:
+        engine = BatchEngine()
+        # Add artifact to batch
+        should_flush = engine.add_artifact(
+            artifact=order_artifact,
+            subscription=subscription,  # Has BatchSpec
+            subscription_index=0,
+        )
+        if should_flush:
+            # Size threshold reached! Flush batch
+            artifacts = engine.flush_batch("agent_name", 0)
+            # Trigger agent with batch
+    """
+    def __init__(self):
+        # Batch state per (agent_name, subscription_index)
+        # Key: (agent_name, subscription_index)
+        # Value: BatchAccumulator
+        self.batches: dict[tuple[str, int], BatchAccumulator] = {}
+    def add_artifact(
+        self,
+        *,
+        artifact: Artifact,
+        subscription: Subscription,
+        subscription_index: int,
+    ) -> bool:
+        """
+        Add artifact to batch accumulator.
+        Returns:
+            True if batch should flush (size threshold reached), False otherwise
+        """
+        if subscription.batch is None:
+            raise ValueError("Subscription must have BatchSpec for batching")
+        batch_key = (subscription.agent_name, subscription_index)
+        # Get or create batch accumulator
+        if batch_key not in self.batches:
+            self.batches[batch_key] = BatchAccumulator(
+                batch_spec=subscription.batch,
+                created_at=datetime.now(),
+            )
+        accumulator = self.batches[batch_key]
+        # Add artifact to batch
+        should_flush = accumulator.add_artifact(artifact)
+        return should_flush
+    def add_artifact_group(
+        self,
+        *,
+        artifacts: list[Artifact],
+        subscription: Subscription,
+        subscription_index: int,
+    ) -> bool:
+        """
+        Add a GROUP of artifacts (e.g., correlated pair) as a SINGLE batch item.
+        This is used for JoinSpec + BatchSpec combinations where we want to batch
+        correlated groups, not individual artifacts.
+        Example: JoinSpec + BatchSpec(size=2) means "batch 2 correlated pairs",
+                 not "batch 2 individual artifacts".
+        Returns:
+            True if batch should flush (size threshold reached), False otherwise
+        """
+        if subscription.batch is None:
+            raise ValueError("Subscription must have BatchSpec for batching")
+        batch_key = (subscription.agent_name, subscription_index)
+        # Get or create batch accumulator
+        if batch_key not in self.batches:
+            self.batches[batch_key] = BatchAccumulator(
+                batch_spec=subscription.batch,
+                created_at=datetime.now(),
+            )
+        accumulator = self.batches[batch_key]
+        # Add ALL artifacts from the group
+        for artifact in artifacts:
+            accumulator.artifacts.append(artifact)
+        # Check size threshold - count GROUPS, not artifacts
+        # We track how many groups have been added by checking batch_spec metadata
+        if subscription.batch.size is not None:
+            # For group batching, we need to track group count separately
+            # For now, we'll use a simple heuristic: count groups by dividing by expected group size
+            # But this is NOT perfect - we need better tracking
+            # BETTER APPROACH: Count how many times we've called add_artifact_group
+            # For now, let's use artifact count as a proxy and check if we've hit the threshold
+            # This will work correctly if all groups are the same size
+            # Actually, let's track group count properly:
+            if not hasattr(accumulator, '_group_count'):
+                accumulator._group_count = 0
+            accumulator._group_count += 1
+            if accumulator._group_count >= subscription.batch.size:
+                return True  # Flush now
+        return False  # Not ready to flush yet
+    def flush_batch(self, agent_name: str, subscription_index: int) -> list[Artifact] | None:
+        """
+        Flush a batch and return its artifacts.
+        Returns:
+            List of artifacts in batch, or None if no batch exists
+        """
+        batch_key = (agent_name, subscription_index)
+        accumulator = self.batches.get(batch_key)
+        if accumulator is None or not accumulator.artifacts:
+            return None
+        # Get artifacts and clear batch
+        artifacts = accumulator.get_artifacts()
+        del self.batches[batch_key]
+        return artifacts
+    def check_timeouts(self) -> list[tuple[str, int]]:
+        """
+        Check all batches for timeout expiry.
+        Returns:
+            List of (agent_name, subscription_index) tuples that should flush
+        """
+        expired = []
+        for batch_key, accumulator in list(self.batches.items()):
+            if accumulator.is_timeout_expired():
+                expired.append(batch_key)
+        return expired
+    def flush_all(self) -> list[tuple[str, int, list[Artifact]]]:
+        """
+        Flush ALL partial batches (for shutdown).
+        Returns:
+            List of (agent_name, subscription_index, artifacts) tuples
+        """
+        results = []
+        for batch_key, accumulator in list(self.batches.items()):
+            if accumulator.artifacts:
+                artifacts = accumulator.get_artifacts()
+                agent_name, subscription_index = batch_key
+                results.append((agent_name, subscription_index, artifacts))
+        # Clear all batches after flush
+        self.batches.clear()
+        return results
+__all__ = ["BatchEngine", "BatchAccumulator"]

flock/correlation_engine.py ADDED Viewed

@@ -0,0 +1,218 @@
+"""
+CorrelationEngine: Manages correlated AND gates with time/count windows.
+Supports JoinSpec-based correlation:
+- Extracts correlation keys from artifacts
+- Groups artifacts by correlation key
+- Enforces time windows (timedelta) or count windows (int)
+- Triggers agents when all required types arrive within window
+"""
+from __future__ import annotations
+from collections import defaultdict
+from datetime import datetime, timedelta
+from typing import TYPE_CHECKING, Any
+if TYPE_CHECKING:
+    from flock.artifacts import Artifact
+    from flock.subscription import JoinSpec, Subscription
+class CorrelationGroup:
+    """
+    Tracks artifacts waiting for correlation within a specific key group.
+    Example: For patient-123, track X-ray (TypeA) and Lab results (TypeB).
+    When both arrive within time/count window, trigger the agent.
+    """
+    def __init__(
+        self,
+        *,
+        correlation_key: Any,
+        required_types: set[str],
+        type_counts: dict[str, int],
+        window_spec: timedelta | int,
+        created_at_sequence: int,
+    ):
+        self.correlation_key = correlation_key
+        self.required_types = required_types  # e.g., {"TypeA", "TypeB"}
+        self.type_counts = type_counts  # e.g., {"TypeA": 1, "TypeB": 1}
+        self.window_spec = window_spec  # timedelta or int
+        self.created_at_sequence = (
+            created_at_sequence  # Global sequence when first artifact arrived
+        )
+        self.created_at_time: datetime | None = None  # Timestamp when first artifact arrived
+        # Waiting pool: type -> list of artifacts
+        self.waiting_artifacts: dict[str, list[Artifact]] = defaultdict(list)
+    def add_artifact(self, artifact: Artifact, current_sequence: int) -> None:
+        """Add artifact to this correlation group's waiting pool."""
+        if self.created_at_time is None:
+            self.created_at_time = datetime.now()
+        self.waiting_artifacts[artifact.type].append(artifact)
+    def is_complete(self) -> bool:
+        """Check if all required types have arrived with correct counts."""
+        for type_name, required_count in self.type_counts.items():
+            if len(self.waiting_artifacts.get(type_name, [])) < required_count:
+                return False
+        return True
+    def is_expired(self, current_sequence: int) -> bool:
+        """Check if this correlation group has expired based on window."""
+        if isinstance(self.window_spec, int):
+            # Count window: expired if current sequence exceeds created + window
+            return (current_sequence - self.created_at_sequence) > self.window_spec
+        elif isinstance(self.window_spec, timedelta):
+            # Time window: expired if current time exceeds created + window
+            if self.created_at_time is None:
+                return False
+            elapsed = datetime.now() - self.created_at_time
+            return elapsed > self.window_spec
+        return False
+    def get_artifacts(self) -> list[Artifact]:
+        """Get all artifacts in the order they should be passed to the agent."""
+        result = []
+        for type_name in self.required_types:
+            # Get the required number of artifacts for this type
+            required_count = self.type_counts[type_name]
+            artifacts_for_type = self.waiting_artifacts[type_name][:required_count]
+            result.extend(artifacts_for_type)
+        return result
+class CorrelationEngine:
+    """
+    Manages correlation state for JoinSpec subscriptions.
+    Responsibilities:
+    1. Extract correlation keys from artifacts using JoinSpec.by lambda
+    2. Group artifacts by correlation key
+    3. Track time/count windows per correlation group
+    4. Return complete correlation groups when all types arrive within window
+    5. Clean up expired correlations
+    Example usage:
+        engine = CorrelationEngine()
+        # Add artifact to correlation tracking
+        completed = engine.add_artifact(
+            artifact=xray_artifact,
+            subscription=subscription,  # Has JoinSpec with by + within
+            agent_name="diagnostician"
+        )
+        if completed:
+            # All types arrived! Trigger agent with correlated artifacts
+            artifacts = completed.get_artifacts()
+    """
+    def __init__(self):
+        # Global artifact sequence (for count windows)
+        self.global_sequence = 0
+        # Correlation state per (agent, subscription_index)
+        # Key: (agent_name, subscription_index)
+        # Value: dict[correlation_key, CorrelationGroup]
+        self.correlation_groups: dict[tuple[str, int], dict[Any, CorrelationGroup]] = defaultdict(
+            dict
+        )
+    def add_artifact(
+        self,
+        *,
+        artifact: Artifact,
+        subscription: Subscription,
+        subscription_index: int,
+    ) -> CorrelationGroup | None:
+        """
+        Add artifact to correlation tracking.
+        Returns:
+            CorrelationGroup if correlation is complete, None otherwise
+        """
+        # Increment global sequence (for count windows)
+        self.global_sequence += 1
+        current_sequence = self.global_sequence
+        # Extract correlation key using JoinSpec.by lambda
+        if subscription.join is None:
+            raise ValueError("Subscription must have JoinSpec for correlation")
+        join_spec: JoinSpec = subscription.join
+        # Parse artifact payload to extract correlation key
+        from flock.registry import type_registry
+        model_cls = type_registry.resolve(artifact.type)
+        payload_instance = model_cls(**artifact.payload)
+        try:
+            correlation_key = join_spec.by(payload_instance)
+        except Exception as e:
+            # Key extraction failed - skip this artifact
+            # TODO: Log warning?
+            return None
+        # Get or create correlation group for this key
+        pool_key = (subscription.agent_name, subscription_index)
+        groups = self.correlation_groups[pool_key]
+        if correlation_key not in groups:
+            # Create new correlation group
+            groups[correlation_key] = CorrelationGroup(
+                correlation_key=correlation_key,
+                required_types=subscription.type_names,
+                type_counts=subscription.type_counts,
+                window_spec=join_spec.within,
+                created_at_sequence=current_sequence,
+            )
+        group = groups[correlation_key]
+        # Check if group expired (for count windows, check BEFORE adding)
+        if group.is_expired(current_sequence):
+            # Group expired - remove it and start fresh
+            del groups[correlation_key]
+            # Create new group
+            groups[correlation_key] = CorrelationGroup(
+                correlation_key=correlation_key,
+                required_types=subscription.type_names,
+                type_counts=subscription.type_counts,
+                window_spec=join_spec.within,
+                created_at_sequence=current_sequence,
+            )
+            group = groups[correlation_key]
+        # Add artifact to group
+        group.add_artifact(artifact, current_sequence)
+        # Check if correlation is complete
+        if group.is_complete():
+            # Complete! Remove from tracking and return
+            completed_group = groups.pop(correlation_key)
+            return completed_group
+        # Not complete yet
+        return None
+    def cleanup_expired(self, agent_name: str, subscription_index: int) -> None:
+        """Clean up expired correlation groups for a specific subscription."""
+        pool_key = (agent_name, subscription_index)
+        groups = self.correlation_groups.get(pool_key, {})
+        # Remove expired groups
+        expired_keys = [
+            key for key, group in groups.items() if group.is_expired(self.global_sequence)
+        ]
+        for key in expired_keys:
+            del groups[key]
+__all__ = ["CorrelationEngine", "CorrelationGroup"]

flock/orchestrator.py CHANGED Viewed

@@ -18,7 +18,10 @@ from opentelemetry.trace import Status, StatusCode
 from pydantic import BaseModel
 from flock.agent import Agent, AgentBuilder
+from flock.artifact_collector import ArtifactCollector
 from flock.artifacts import Artifact
+from flock.batch_accumulator import BatchEngine
+from flock.correlation_engine import CorrelationEngine
 from flock.helper.cli_helper import init_console
 from flock.logging.auto_trace import AutoTracedMeta
 from flock.mcp import (
@@ -128,6 +131,12 @@ class Flock(metaclass=AutoTracedMeta):
         self.max_agent_iterations: int = max_agent_iterations
         self._agent_iteration_count: dict[str, int] = {}
         self.is_dashboard: bool = False
+        # AND gate logic: Artifact collection for multi-type subscriptions
+        self._artifact_collector = ArtifactCollector()
+        # JoinSpec logic: Correlation engine for correlated AND gates
+        self._correlation_engine = CorrelationEngine()
+        # BatchSpec logic: Batch accumulator for size/timeout batching
+        self._batch_engine = BatchEngine()
         # Unified tracing support
         self._workflow_span = None
         self._auto_workflow_enabled = os.getenv("FLOCK_AUTO_WORKFLOW_TRACE", "false").lower() in {
@@ -671,7 +680,11 @@ class Flock(metaclass=AutoTracedMeta):
         self.is_dashboard = is_dashboard
         # Only show banner in CLI mode, not dashboard mode
         if not self.is_dashboard:
-            init_console(clear_screen=True, show_banner=True, model=self.model)
+            try:
+                init_console(clear_screen=True, show_banner=True, model=self.model)
+            except (UnicodeEncodeError, UnicodeDecodeError):
+                # Skip banner on Windows consoles with encoding issues (e.g., tests, CI)
+                pass
         # Handle different input types
         if isinstance(obj, Artifact):
             # Already an artifact - publish as-is
@@ -881,10 +894,90 @@ class Flock(metaclass=AutoTracedMeta):
                     continue
                 if self._seen_before(artifact, agent):
                     continue
+                # JoinSpec CORRELATION: Check if subscription has correlated AND gate
+                if subscription.join is not None:
+                    # Use CorrelationEngine for JoinSpec (correlated AND gates)
+                    subscription_index = agent.subscriptions.index(subscription)
+                    completed_group = self._correlation_engine.add_artifact(
+                        artifact=artifact,
+                        subscription=subscription,
+                        subscription_index=subscription_index,
+                    )
+                    if completed_group is None:
+                        # Still waiting for correlation to complete
+                        continue
+                    # Correlation complete! Get all correlated artifacts
+                    artifacts = completed_group.get_artifacts()
+                else:
+                    # AND GATE LOGIC: Use artifact collector for simple AND gates (no correlation)
+                    is_complete, artifacts = self._artifact_collector.add_artifact(
+                        agent, subscription, artifact
+                    )
+                    if not is_complete:
+                        # Still waiting for more types (AND gate incomplete)
+                        continue
+                # BatchSpec BATCHING: Check if subscription has batch accumulator
+                if subscription.batch is not None:
+                    # Add to batch accumulator
+                    subscription_index = agent.subscriptions.index(subscription)
+                    # COMBINED FEATURES: JoinSpec + BatchSpec
+                    # If we have JoinSpec, artifacts is a correlated GROUP - treat as single batch item
+                    # If we have AND gate, artifacts is a complete set - treat as single batch item
+                    # Otherwise (single type), add each artifact individually
+                    if subscription.join is not None or len(subscription.type_models) > 1:
+                        # JoinSpec or AND gate: Treat artifact group as ONE batch item
+                        should_flush = self._batch_engine.add_artifact_group(
+                            artifacts=artifacts,
+                            subscription=subscription,
+                            subscription_index=subscription_index,
+                        )
+                    else:
+                        # Single type subscription: Add each artifact individually
+                        should_flush = False
+                        for single_artifact in artifacts:
+                            should_flush = self._batch_engine.add_artifact(
+                                artifact=single_artifact,
+                                subscription=subscription,
+                                subscription_index=subscription_index,
+                            )
+                            if should_flush:
+                                # Size threshold reached! Flush batch now
+                                break
+                    if not should_flush:
+                        # Batch not full yet - wait for more artifacts
+                        continue
+                    # Flush the batch and get all accumulated artifacts
+                    batched_artifacts = self._batch_engine.flush_batch(
+                        agent.name, subscription_index
+                    )
+                    if batched_artifacts is None:
+                        # No batch to flush (shouldn't happen, but defensive)
+                        continue
+                    # Replace artifacts with batched artifacts
+                    artifacts = batched_artifacts
+                # Complete! Schedule agent with all collected artifacts
                 # T068: Increment iteration counter
                 self._agent_iteration_count[agent.name] = iteration_count + 1
-                self._mark_processed(artifact, agent)
-                self._schedule_task(agent, [artifact])
+                # Mark all artifacts as processed (prevent duplicate triggers)
+                for collected_artifact in artifacts:
+                    self._mark_processed(collected_artifact, agent)
+                # Schedule agent with ALL artifacts (batched, correlated, or AND gate complete)
+                self._schedule_task(agent, artifacts)
     def _schedule_task(self, agent: Agent, artifacts: list[Artifact]) -> None:
         task = asyncio.create_task(self._run_agent_task(agent, artifacts))
@@ -933,6 +1026,47 @@ class Flock(metaclass=AutoTracedMeta):
             except Exception as exc:  # pragma: no cover - defensive logging
                 self._logger.exception("Failed to record artifact consumption: %s", exc)
+    # Batch Helpers --------------------------------------------------------
+    async def _check_batch_timeouts(self) -> None:
+        """Check all batches for timeout expiry and flush expired batches.
+        This method is called periodically or manually (in tests) to enforce
+        timeout-based batching.
+        """
+        expired_batches = self._batch_engine.check_timeouts()
+        for agent_name, subscription_index in expired_batches:
+            # Flush the expired batch
+            artifacts = self._batch_engine.flush_batch(agent_name, subscription_index)
+            if artifacts is None:
+                continue
+            # Get the agent
+            agent = self._agents.get(agent_name)
+            if agent is None:
+                continue
+            # Schedule agent with batched artifacts
+            self._schedule_task(agent, artifacts)
+    async def _flush_all_batches(self) -> None:
+        """Flush all partial batches (for shutdown - ensures zero data loss)."""
+        all_batches = self._batch_engine.flush_all()
+        for agent_name, subscription_index, artifacts in all_batches:
+            # Get the agent
+            agent = self._agents.get(agent_name)
+            if agent is None:
+                continue
+            # Schedule agent with partial batch
+            self._schedule_task(agent, artifacts)
+        # Wait for all scheduled tasks to complete
+        await self.run_until_idle()
     # Helpers --------------------------------------------------------------
     def _normalize_input(

flock/subscription.py CHANGED Viewed

@@ -4,6 +4,7 @@ from __future__ import annotations
 from collections.abc import Callable, Iterable, Sequence
 from dataclasses import dataclass
+from datetime import timedelta
 from typing import TYPE_CHECKING, Any
 from pydantic import BaseModel
@@ -26,16 +27,68 @@ class TextPredicate:
 @dataclass
 class JoinSpec:
-    kind: str
-    window: float
-    by: Callable[[Artifact], Any] | None = None
+    """
+    Specification for correlated AND gates.
+    Correlates artifacts by a common key within a time OR count window.
+    Examples:
+        # Time-based correlation (within 5 minutes)
+        JoinSpec(
+            by=lambda x: x.correlation_id,
+            within=timedelta(minutes=5)
+        )
+        # Count-based correlation (within next 10 artifacts)
+        JoinSpec(
+            by=lambda x: x.correlation_id,
+            within=10
+        )
+    Args:
+        by: Callable that extracts the correlation key from an artifact payload
+        within: Window for correlation
+            - timedelta: Time window (artifacts must arrive within this time)
+            - int: Count window (artifacts must arrive within N published artifacts)
+    """
+    by: Callable[[BaseModel], Any]  # Extract correlation key from payload
+    within: timedelta | int  # Time window OR count window for correlation
 @dataclass
 class BatchSpec:
-    size: int
-    within: float
-    by: Callable[[Artifact], Any] | None = None
+    """
+    Specification for batch processing.
+    Accumulates artifacts and triggers agent when:
+    - Size threshold reached (e.g., batch of 10)
+    - Timeout expires (e.g., flush every 30 seconds)
+    - Whichever comes first
+    Examples:
+        # Size-based batching (flush when 25 artifacts accumulated)
+        BatchSpec(size=25)
+        # Timeout-based batching (flush every 30 seconds)
+        BatchSpec(timeout=timedelta(seconds=30))
+        # Hybrid (whichever comes first)
+        BatchSpec(size=100, timeout=timedelta(minutes=5))
+    Args:
+        size: Optional batch size threshold (flush when this many artifacts accumulated)
+        timeout: Optional timeout threshold (flush when this much time elapsed since first artifact)
+    Note: At least one of size or timeout must be specified.
+    """
+    size: int | None = None
+    timeout: timedelta | None = None
+    def __post_init__(self):
+        if self.size is None and self.timeout is None:
+            raise ValueError("BatchSpec requires at least one of: size, timeout")
 class Subscription:
@@ -60,7 +113,17 @@ class Subscription:
             raise ValueError("Subscription must declare at least one type.")
         self.agent_name = agent_name
         self.type_models: list[type[BaseModel]] = list(types)
-        self.type_names: set[str] = {type_registry.register(t) for t in types}
+        # Register all types and build counts (supports duplicates for count-based AND gates)
+        type_name_list = [type_registry.register(t) for t in types]
+        self.type_names: set[str] = set(type_name_list)  # Unique type names (for matching)
+        # Count-based AND gate: Track how many of each type are required
+        # Example: .consumes(A, A, B) → {"TypeA": 2, "TypeB": 1}
+        self.type_counts: dict[str, int] = {}
+        for type_name in type_name_list:
+            self.type_counts[type_name] = self.type_counts.get(type_name, 0) + 1
         self.where = list(where or [])
         self.text_predicates = list(text_predicates or [])
         self.from_agents = set(from_agents or [])

{flock_core-0.5.2.dist-info → flock_core-0.5.3.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: flock-core
-Version: 0.5.2
+Version: 0.5.3
 Summary: Flock: A declrative framework for building and orchestrating AI agents.
 Author-email: Andre Ratzenberger <andre.ratzenberger@whiteduck.de>
 License: MIT
@@ -266,7 +266,7 @@ flock = Flock(os.getenv("DEFAULT_MODEL", "openai/gpt-4.1"))
 bug_detector = flock.agent("bug_detector").consumes(CodeSubmission).publishes(BugAnalysis)
 security_auditor = flock.agent("security_auditor").consumes(CodeSubmission).publishes(SecurityAnalysis)
-# This agent AUTOMATICALLY waits for both analyses
+# AND gate: This agent AUTOMATICALLY waits for BOTH analyses before triggering
 final_reviewer = flock.agent("final_reviewer").consumes(BugAnalysis, SecurityAnalysis).publishes(FinalReview)
 # 4. Run with real-time dashboard
@@ -343,29 +343,77 @@ analyzer = (
 )
 ```
-**Advanced subscriptions:**
+**Logic Operations (AND/OR Gates):**
+Flock provides intuitive syntax for coordinating multiple input types:
+```python
+# AND gate: Wait for BOTH types before triggering
+diagnostician = flock.agent("diagnostician").consumes(XRayAnalysis, LabResults).publishes(Diagnosis)
+# Agent triggers only when both XRayAnalysis AND LabResults are available
+# OR gate: Trigger on EITHER type (via chaining)
+alert_handler = flock.agent("alerts").consumes(SystemAlert).consumes(UserAlert).publishes(Response)
+# Agent triggers when SystemAlert OR UserAlert is published
+# Count-based AND gate: Wait for MULTIPLE instances of the same type
+aggregator = flock.agent("aggregator").consumes(Order, Order, Order).publishes(BatchSummary)
+# Agent triggers when THREE Order artifacts are available
+# Mixed counts: Different requirements per type
+validator = flock.agent("validator").consumes(Image, Image, Metadata).publishes(ValidationResult)
+# Agent triggers when TWO Images AND ONE Metadata are available
+```
+**What just happened:**
+- ✅ **Natural syntax** - Code clearly expresses intent ("wait for 3 orders")
+- ✅ **Order-independent** - Artifacts can arrive in any sequence
+- ✅ **Latest wins** - If 4 As arrive but need 3, uses the 3 most recent
+- ✅ **Zero configuration** - No manual coordination logic needed
+**Advanced subscriptions unlock crazy powerful patterns:**
 ```python
-# Conditional consumption - only high-severity cases
+# 🎯 Predicates - Smart filtering (only process critical cases)
 urgent_care = flock.agent("urgent").consumes(
     Diagnosis,
-    where=lambda d: d.severity in ["Critical", "High"]
+    where=lambda d: d.severity in ["Critical", "High"]  # Conditional routing!
 )
-# Batch processing - wait for 10 items
-batch_processor = flock.agent("batch").consumes(
-    Event,
-    batch=BatchSpec(size=10, timeout=timedelta(seconds=30))
+# 📦 BatchSpec - Cost optimization (process 10 at once = 90% cheaper API calls)
+payment_processor = flock.agent("payments").consumes(
+    Transaction,
+    batch=BatchSpec(size=25, timeout=timedelta(seconds=30))  # $5 saved per batch!
 )
-# Join operations - wait for multiple types within time window
-correlator = flock.agent("correlator").consumes(
-    SignalA,
-    SignalB,
-    join=JoinSpec(within=timedelta(minutes=5))
+# 🔗 JoinSpec - Data correlation (match orders + shipments by ID)
+customer_service = flock.agent("notifications").consumes(
+    Order,
+    Shipment,
+    join=JoinSpec(by=lambda x: x.order_id, within=timedelta(hours=24))  # Correlated!
+)
+# 🏭 Combined Features - Correlate sensors, THEN batch for analysis
+quality_control = flock.agent("qc").consumes(
+    TemperatureSensor,
+    PressureSensor,
+    join=JoinSpec(by=lambda x: x.device_id, within=timedelta(seconds=30)),
+    batch=BatchSpec(size=5, timeout=timedelta(seconds=45))  # IoT at scale!
 )
 ```
+**What just happened:**
+- ✅ **Predicates** route work by business rules ("only critical severity")
+- ✅ **BatchSpec** optimizes costs (25 transactions = 1 API call instead of 25)
+- ✅ **JoinSpec** correlates related data (orders ↔ shipments, sensors ↔ readings)
+- ✅ **Combined** delivers production-grade multi-stage pipelines
+**Real-world impact:**
+- 💰 E-commerce: Save $5 per batch on payment processing fees
+- 🏥 Healthcare: Correlate patient scans + lab results for diagnosis
+- 🏭 Manufacturing: Monitor 1000+ IoT sensors with efficient batching
+- 📊 Finance: Match trades + confirmations within 5-minute windows
 ### Visibility Controls (The Security)
 **Unlike other frameworks, Flock has zero-trust security built-in:**

{flock_core-0.5.2.dist-info → flock_core-0.5.3.dist-info}/RECORD RENAMED Viewed

@@ -1,15 +1,18 @@
 flock/__init__.py,sha256=fvp4ltfaAGmYliShuTY_XVIpOUN6bMXbWiBnwb1NBoM,310
-flock/agent.py,sha256=pYqVb1Z6BzIpM8kJoSl1XmirF8u7Gi0YIbUuGB0pcv4,41327
+flock/agent.py,sha256=vk15p1bw2YeTPAWLZHe2I6c558cAkZXi5DERbIL15kg,41808
+flock/artifact_collector.py,sha256=5aLgR_YSyMprWEiVA39JqpMue--N2vbpMICTWQX9b5A,6394
 flock/artifacts.py,sha256=3vQQ1J7QxTzeQBUGaNLiyojlmBv1NfdhFC98-qj8fpU,2541
+flock/batch_accumulator.py,sha256=b1DEQ1YUhwI9aG0frgFWCLlytsmYbpqG_-BoNe9emhk,8049
 flock/cli.py,sha256=lPtKxEXnGtyuTh0gyG3ixEIFS4Ty6Y0xsPd6SpUTD3U,4526
 flock/components.py,sha256=17vhNMHKc3VUruEbSdb9YNKcDziIe0coS9jpfWBmX4o,6259
+flock/correlation_engine.py,sha256=cDSCPDTIo-TuRYESMIqfKjs53avs7gPVdzZ_AfpH8a0,7999
 flock/examples.py,sha256=eQb8k6EYBbUhauFuSN_0EIIu5KW0mTqJU0HM4-p14sc,3632
-flock/orchestrator.py,sha256=f7FD1i2bcpkHEER0w3DEgzcWp1AmmBSbegVODdhYxdY,36661
+flock/orchestrator.py,sha256=O_4PdPZDyysZcOhzxKaFF1W0bp3SHtZonynTgHwSoxw,42786
 flock/registry.py,sha256=s0-H-TMtOsDZiZQCc7T1tYiWQg3OZHn5T--jaI_INIc,4786
 flock/runtime.py,sha256=UG-38u578h628mSddBmyZn2VIzFQ0wlHCpCALFiScqA,8518
 flock/service.py,sha256=JDdjjPTPH6NFezAr8x6svtqxIGXA7-AyHS11GF57g9Q,11041
 flock/store.py,sha256=H6z1_y5uDp_4UnHWqrxNksyoSGlzeVTgLY3Sv-guSTU,45793
-flock/subscription.py,sha256=ylIOV2G37KNfncdexrl4kxZOjo7SLS3LmddTaoSkrIk,3103
+flock/subscription.py,sha256=0fqjGVAr-3u1azSsXJ-xVjnUgSSYVO2a0Gd_zln2tZA,5422
 flock/utilities.py,sha256=bqTPnFF6E-pDqx1ISswDNEzTU2-ED_URlkyKWLjF3mU,12109
 flock/visibility.py,sha256=Cu2PMBjRtqjiWzlwHLCIC2AUFBjJ2augecG-jvK8ky0,2949
 flock/api/themes.py,sha256=BOj1e0LHx6BDLdnVdXh1LKsbQ_ZeubH9UCoj08dC1yc,1886
@@ -521,8 +524,8 @@ flock/themes/zenburned.toml,sha256=UEmquBbcAO3Zj652XKUwCsNoC2iQSlIh-q5c6DH-7Kc,1
 flock/themes/zenwritten-dark.toml,sha256=-dgaUfg1iCr5Dv4UEeHv_cN4GrPUCWAiHSxWK20X1kI,1663
 flock/themes/zenwritten-light.toml,sha256=G1iEheCPfBNsMTGaVpEVpDzYBHA_T-MV27rolUYolmE,1666
 flock/utility/output_utility_component.py,sha256=yVHhlIIIoYKziI5UyT_zvQb4G-NsxCTgLwA1wXXTTj4,9047
-flock_core-0.5.2.dist-info/METADATA,sha256=tCrSJS6TpMQftwK0xDIAmW3cK2-2r33WaM58tyvX4i0,36666
-flock_core-0.5.2.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
-flock_core-0.5.2.dist-info/entry_points.txt,sha256=UQdPmtHd97gSA_IdLt9MOd-1rrf_WO-qsQeIiHWVrp4,42
-flock_core-0.5.2.dist-info/licenses/LICENSE,sha256=U3IZuTbC0yLj7huwJdldLBipSOHF4cPf6cUOodFiaBE,1072
-flock_core-0.5.2.dist-info/RECORD,,
+flock_core-0.5.3.dist-info/METADATA,sha256=0Ec9QS5oTYf1t5r_FSpd3xAu3JXapC5FjHDP05GsRJA,39146
+flock_core-0.5.3.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
+flock_core-0.5.3.dist-info/entry_points.txt,sha256=UQdPmtHd97gSA_IdLt9MOd-1rrf_WO-qsQeIiHWVrp4,42
+flock_core-0.5.3.dist-info/licenses/LICENSE,sha256=U3IZuTbC0yLj7huwJdldLBipSOHF4cPf6cUOodFiaBE,1072
+flock_core-0.5.3.dist-info/RECORD,,

{flock_core-0.5.2.dist-info → flock_core-0.5.3.dist-info}/WHEEL RENAMED Viewed

File without changes

{flock_core-0.5.2.dist-info → flock_core-0.5.3.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{flock_core-0.5.2.dist-info → flock_core-0.5.3.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

flock-core 0.5.2__py3-none-any.whl → 0.5.3__py3-none-any.whl

Potentially problematic release.

flock-core 0.5.2py3-none-any.whl → 0.5.3py3-none-any.whl