PyPI - lionagi - Versions diffs - 0.13.6__py3-none-any.whl → 0.14.0__py3-none-any.whl - Mend

lionagi-0.13.6-py3-none-any.whl → lionagi-0.14.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (23)

lionagi/_types.py +1 -0
lionagi/fields/base.py +0 -1
lionagi/libs/concurrency/__init__.py +25 -0
lionagi/libs/concurrency/cancel.py +134 -0
lionagi/libs/concurrency/errors.py +35 -0
lionagi/libs/concurrency/patterns.py +252 -0
lionagi/libs/concurrency/primitives.py +242 -0
lionagi/libs/concurrency/task.py +109 -0
lionagi/operations/ReAct/ReAct.py +0 -2
lionagi/operations/ReAct/utils.py +1 -9
lionagi/operations/builder.py +46 -0
lionagi/operations/flow.py +292 -383
lionagi/operations/node.py +2 -1
lionagi/operations/operate/operate.py +0 -3
lionagi/protocols/graph/edge.py +1 -1
lionagi/session/branch.py +0 -4
lionagi/session/prompts.py +0 -1
lionagi/session/session.py +2 -2
lionagi/version.py +1 -1
{lionagi-0.13.6.dist-info → lionagi-0.14.0.dist-info}/METADATA +1 -1
{lionagi-0.13.6.dist-info → lionagi-0.14.0.dist-info}/RECORD +23 -17
{lionagi-0.13.6.dist-info → lionagi-0.14.0.dist-info}/WHEEL +0 -0
{lionagi-0.13.6.dist-info → lionagi-0.14.0.dist-info}/licenses/LICENSE +0 -0

lionagi/operations/flow.py (changed)

@@ -2,421 +2,330 @@
 #
 # SPDX-License-Identifier: Apache-2.0
-import asyncio
-import contextlib
+"""
+Dependency-aware flow execution using structured concurrency primitives.
+Provides clean dependency management and context inheritance for operation graphs,
+using Events for synchronization and CapacityLimiter for concurrency control.
+"""
+import os
 from typing import Any
+from lionagi.libs.concurrency.primitives import CapacityLimiter
+from lionagi.libs.concurrency.primitives import Event as ConcurrencyEvent
+from lionagi.libs.concurrency.task import create_task_group
 from lionagi.operations.node import Operation
-from lionagi.operations.utils import prepare_session
-from lionagi.protocols.types import ID, Edge, Graph, Node
+from lionagi.protocols.types import EventStatus, Graph
 from lionagi.session.branch import Branch
 from lionagi.session.session import Session
 from lionagi.utils import to_dict
+# Maximum concurrency when None is specified (effectively unlimited)
+UNLIMITED_CONCURRENCY = int(os.environ.get("LIONAGI_MAX_CONCURRENCY", "10000"))
+class DependencyAwareExecutor:
+    """Executes operation graphs with dependency management and context inheritance."""
+    def __init__(
+        self,
+        session: Session,
+        graph: Graph,
+        context: dict[str, Any] | None = None,
+        max_concurrent: int = 5,
+        verbose: bool = False,
+        default_branch: Branch | None = None,
+    ):
+        """Initialize the executor.
+        Args:
+            session: The session for branch management
+            graph: The operation graph to execute
+            context: Initial execution context
+            max_concurrent: Maximum concurrent operations
+            verbose: Enable verbose logging
+            default_branch: Optional default branch for operations
+        """
+        self.session = session
+        self.graph = graph
+        self.context = context or {}
+        self.max_concurrent = max_concurrent
+        self.verbose = verbose
+        self._default_branch = default_branch
+        # Track results and completion
+        self.results = {}
+        self.completion_events = {}  # operation_id -> Event
+        self.operation_branches = {}  # operation_id -> Branch
+        # Initialize completion events for all operations
+        for node in graph.internal_nodes.values():
+            if isinstance(node, Operation):
+                self.completion_events[node.id] = ConcurrencyEvent()
+    async def execute(self) -> dict[str, Any]:
+        """Execute the operation graph."""
+        if not self.graph.is_acyclic():
+            raise ValueError("Graph must be acyclic for flow execution")
+        # Create capacity limiter for concurrency control
+        # None means no limit, use the configured unlimited value
+        capacity = (
+            self.max_concurrent
+            if self.max_concurrent is not None
+            else UNLIMITED_CONCURRENCY
+        )
+        limiter = CapacityLimiter(capacity)
+        # Execute all operations using structured concurrency
+        async with create_task_group() as tg:
+            for node in self.graph.internal_nodes.values():
+                if isinstance(node, Operation):
+                    await tg.start_soon(self._execute_operation, node, limiter)
+        # Return results
+        return {
+            "completed_operations": list(self.results.keys()),
+            "operation_results": self.results,
+            "final_context": self.context,
+        }
+    async def _execute_operation(
+        self, operation: Operation, limiter: CapacityLimiter
+    ):
+        """Execute a single operation with dependency waiting."""
+        try:
+            # Wait for dependencies
+            await self._wait_for_dependencies(operation)
+            # Acquire capacity to limit concurrency
+            async with limiter:
+                # Prepare operation context
+                await self._prepare_operation(operation)
+                # Execute the operation
+                if self.verbose:
+                    print(f"Executing operation: {str(operation.id)[:8]}")
+                branch = self.operation_branches.get(
+                    operation.id, self.session.default_branch
+                )
+                operation.execution.status = EventStatus.PROCESSING
-async def flow(
-    branch: Branch,
-    graph: Graph,
-    *,
-    context: dict[str, Any] | None = None,
-    parallel: bool = True,
-    max_concurrent: int = 5,
-    verbose: bool = False,
-    session: Session | None = None,
-) -> dict[str, Any]:
-    """
-    Execute a graph-based workflow using the branch's operations.
-    For simple graphs, executes directly on the branch.
-    For parallel execution, uses session for coordination.
-    Args:
-        branch: The branch to execute operations on
-        graph: The workflow graph containing Operation nodes
-        context: Initial context
-        parallel: Whether to execute independent operations in parallel
-        max_concurrent: Max concurrent operations
-        verbose: Enable verbose logging
-        session: Optional session for multi-branch parallel execution
-    Returns:
-        Execution results with completed operations and final context
-    """
-    # Validate graph
-    if not graph.is_acyclic():
-        raise ValueError("Graph must be acyclic for flow execution")
-    session, branch = prepare_session(session, branch)
-    if not parallel or max_concurrent == 1:
-        return await _execute_sequential(branch, graph, context, verbose)
-    return await _execute_parallel(
-        session, graph, context, max_concurrent, verbose
-    )
-async def _execute_sequential(
-    branch: Branch, graph: Graph, context: dict[str, Any] | None, verbose: bool
-) -> dict[str, Any]:
-    """Execute graph sequentially on a single branch."""
-    completed = []
-    results = {}
-    execution_context = context or {}
-    # Get execution order (topological sort)
-    execution_order = _topological_sort(graph)
+                await operation.invoke(branch)
-    for node_id in execution_order:
-        node = graph.internal_nodes[node_id]
+                # Store results
+                self.results[operation.id] = operation.response
+                operation.execution.status = EventStatus.COMPLETED
-        if not isinstance(node, Operation):
-            continue
+                # Update context if response contains context
+                if (
+                    isinstance(operation.response, dict)
+                    and "context" in operation.response
+                ):
+                    self.context.update(operation.response["context"])
+                if self.verbose:
+                    print(f"Completed operation: {str(operation.id)[:8]}")
+        except Exception as e:
+            operation.execution.status = EventStatus.FAILED
+            operation.execution.error = str(e)
+            self.results[operation.id] = {"error": str(e)}
+            if self.verbose:
+                print(f"Operation {str(operation.id)[:8]} failed: {e}")
+        finally:
+            # Signal completion regardless of success/failure
+            self.completion_events[operation.id].set()
+    async def _wait_for_dependencies(self, operation: Operation):
+        """Wait for all dependencies to complete."""
+        # Special handling for aggregations
+        if operation.metadata.get("aggregation"):
+            sources = operation.parameters.get("aggregation_sources", [])
+            if self.verbose and sources:
+                print(
+                    f"Aggregation {str(operation.id)[:8]} waiting for {len(sources)} sources"
+                )
-        # Check dependencies using set for fast lookup
-        completed_set = set(completed)
+            # Wait for ALL sources
+            for source_id in sources:
+                if source_id in self.completion_events:
+                    await self.completion_events[source_id].wait()
-        # Check if dependencies and conditions are satisfied
-        if not await _dependencies_satisfied_async(
-            node, graph, completed_set, results, execution_context
-        ):
-            continue
+        # Regular dependency checking
+        predecessors = self.graph.get_predecessors(operation)
+        for pred in predecessors:
+            if self.verbose:
+                print(
+                    f"Operation {str(operation.id)[:8]} waiting for {str(pred.id)[:8]}"
+                )
+            await self.completion_events[pred.id].wait()
+        # Check edge conditions
+        incoming_edges = [
+            edge
+            for edge in self.graph.internal_edges.values()
+            if edge.tail == operation.id
+        ]
+        for edge in incoming_edges:
+            # Wait for head to complete
+            if edge.head in self.completion_events:
+                await self.completion_events[edge.head].wait()
+            # Evaluate edge condition
+            if edge.condition is not None:
+                result_value = self.results.get(edge.head)
+                if result_value is not None and not isinstance(
+                    result_value, (str, int, float, bool)
+                ):
+                    result_value = to_dict(result_value, recursive=True)
-        predecessors = graph.get_predecessors(node)
+                ctx = {"result": result_value, "context": self.context}
+                if not await edge.condition.apply(ctx):
+                    raise ValueError(
+                        f"Edge condition not satisfied for {str(operation.id)[:8]}"
+                    )
+    async def _prepare_operation(self, operation: Operation):
+        """Prepare operation with context and branch assignment."""
         # Update operation context with predecessors
+        predecessors = self.graph.get_predecessors(operation)
         if predecessors:
             pred_context = {}
             for pred in predecessors:
-                if pred.id in results:
-                    result = results[pred.id]
-                # Use to_dict for proper serialization of complex types only
-                if result is not None and not isinstance(
-                    result, (str, int, float, bool)
-                ):
-                    result = to_dict(result, recursive=True)
-                pred_context[f"{pred.id}_result"] = result
+                if pred.id in self.results:
+                    result = self.results[pred.id]
+                    if result is not None and not isinstance(
+                        result, (str, int, float, bool)
+                    ):
+                        result = to_dict(result, recursive=True)
+                    pred_context[f"{pred.id}_result"] = result
-            if "context" not in node.parameters:
-                node.parameters["context"] = pred_context
+            if "context" not in operation.parameters:
+                operation.parameters["context"] = pred_context
             else:
-                node.parameters["context"].update(pred_context)
+                operation.parameters["context"].update(pred_context)
         # Add execution context
-        if execution_context:
-            if "context" not in node.parameters:
-                node.parameters["context"] = execution_context.copy()
+        if self.context:
+            if "context" not in operation.parameters:
+                operation.parameters["context"] = self.context.copy()
             else:
-                node.parameters["context"].update(execution_context)
-        # Execute operation
-        if verbose:
-            print(f"Executing operation: {node.id}")
-        await node.invoke(branch)
-        completed.append(node.id)
-        results[node.id] = node.response
-        # Update execution context
-        if isinstance(node.response, dict) and "context" in node.response:
-            execution_context.update(node.response["context"])
-    return {
-        "completed_operations": completed,
-        "operation_results": results,
-        "final_context": execution_context,
-    }
-async def _execute_parallel(
-    session: Session,
-    graph: Graph,
-    context: dict[str, Any] | None,
-    max_concurrent: int,
-    verbose: bool,
-) -> dict[str, Any]:
-    """Execute graph in parallel using multiple branches."""
-    results = {}
-    execution_context = context or {}
-    completed = []  # Track completed operations
-    # Get operation nodes in topological order
-    operation_nodes = []
-    execution_order = _topological_sort(graph)
-    for node_id in execution_order:
-        node = graph.internal_nodes.get(node_id)
-        if isinstance(node, Operation):
-            operation_nodes.append(node)
-    # Use session branches context manager for safe parallel execution
-    async with session.branches:
-        # Create a pool of worker branches
-        worker_branches = []
-        for i in range(min(max_concurrent, len(operation_nodes))):
-            if i == 0:
-                worker_branches.append(session.default_branch)
-            else:
-                worker_branches.append(session.split(session.default_branch))
-        # Process nodes in dependency order
-        remaining_nodes = {node.id for node in operation_nodes}
-        executing_tasks: dict[ID[Operation], asyncio.Task] = {}
-        blocked_nodes = set()  # Nodes that have been checked and found blocked
-        max_iterations = 1000  # Prevent infinite loops
-        iteration = 0
-        while (
-            remaining_nodes or executing_tasks
-        ) and iteration < max_iterations:
-            iteration += 1
-            # Check for completed tasks
-            completed_in_round = []
-            for node_id, task in list(executing_tasks.items()):
-                if task.done():
-                    try:
-                        result = await task
-                        results[node_id] = result
-                        completed.append(node_id)
-                        completed_in_round.append(node_id)
-                        if verbose:
-                            print(f"Completed operation: {node_id}")
-                    except Exception as e:
-                        if verbose:
-                            print(f"Operation {node_id} failed: {e}")
-                        results[node_id] = {"error": str(e)}
-                        completed.append(node_id)
-                        completed_in_round.append(node_id)
-                    finally:
-                        del executing_tasks[node_id]
-            # Remove completed from remaining
-            remaining_nodes -= set(completed_in_round)
-            # If new completions, clear blocked nodes to re-check
-            if completed_in_round:
-                blocked_nodes.clear()
-            # Find nodes ready to execute (skip already blocked nodes)
-            ready_nodes = []
-            completed_set = set(completed)
-            newly_blocked = []
-            for node in operation_nodes:
-                if (
-                    node.id in remaining_nodes
-                    and node.id not in executing_tasks
-                    and node.id not in blocked_nodes
-                    and len(executing_tasks) < max_concurrent
-                ):
-                    if await _dependencies_satisfied_async(
-                        node, graph, completed_set, results, execution_context
+                operation.parameters["context"].update(self.context)
+        # Determine and assign branch
+        branch = await self._resolve_branch_for_operation(operation)
+        self.operation_branches[operation.id] = branch
+    async def _resolve_branch_for_operation(
+        self, operation: Operation
+    ) -> Branch:
+        """Resolve which branch an operation should use based on inheritance rules."""
+        # Check if operation has an explicit branch_id
+        if operation.branch_id:
+            try:
+                return self.session.branches[operation.branch_id]
+            except:
+                pass
+        # Get predecessors for context inheritance check
+        predecessors = self.graph.get_predecessors(operation)
+        # Handle context inheritance
+        if operation.metadata.get("inherit_context"):
+            primary_dep_id = operation.metadata.get("primary_dependency")
+            if primary_dep_id and primary_dep_id in self.results:
+                # Find the operation that was the primary dependency
+                for node in self.graph.internal_nodes.values():
+                    if (
+                        isinstance(node, Operation)
+                        and node.id == primary_dep_id
+                        and node.branch_id
                     ):
-                        ready_nodes.append(node)
-                    else:
-                        newly_blocked.append(node.id)
-            # Update blocked nodes
-            blocked_nodes.update(newly_blocked)
-            # If no ready nodes but we have remaining and no executing tasks, we're stuck
-            if not ready_nodes and remaining_nodes and not executing_tasks:
-                if verbose:
-                    print(
-                        f"Deadlock detected: {len(remaining_nodes)} nodes cannot execute"
-                    )
-                    remaining_node_names = [
-                        n.operation
-                        for n in operation_nodes
-                        if n.id in remaining_nodes
-                    ]
-                    print(f"Remaining operations: {remaining_node_names}")
-                # Mark remaining nodes as failed
-                for node in operation_nodes:
-                    if node.id in remaining_nodes:
-                        results[node.id] = {
-                            "error": "Blocked by unsatisfied conditions"
-                        }
-                        completed.append(node.id)
-                break
-            # Start execution for ready nodes
-            started_count = 0
-            for node in ready_nodes:
-                if len(executing_tasks) >= max_concurrent:
-                    break
-                # Get an available branch (round-robin)
-                branch_idx = len(executing_tasks) % len(worker_branches)
-                node_branch = worker_branches[branch_idx]
-                # Check if node specifies a branch
-                branch_id = node.parameters.get("branch_id")
-                if branch_id:
-                    try:
-                        node_branch = session.branches[branch_id]
-                    except:
-                        pass  # Use the selected worker branch
-                # Create task for this node
-                task = asyncio.create_task(
-                    _execute_node_async(
-                        node,
-                        node_branch,
-                        graph,
-                        results,
-                        execution_context,
-                        verbose,
-                    )
-                )
-                executing_tasks[node.id] = task
-                started_count += 1
-                if verbose:
-                    branch_name = (
-                        getattr(node_branch, "name", None) or node_branch.id
+                        try:
+                            primary_branch = self.session.branches[
+                                node.branch_id
+                            ]
+                            # Use session.branches context manager for split
+                            async with self.session.branches:
+                                split_branch = self.session.split(
+                                    primary_branch
+                                )
+                            if self.verbose:
+                                print(
+                                    f"Operation {str(operation.id)[:8]} inheriting context from {str(primary_dep_id)[:8]}"
+                                )
+                            return split_branch
+                        except:
+                            pass
+        # If operation has dependencies but no inheritance, create fresh branch
+        elif predecessors:
+            try:
+                async with self.session.branches:
+                    fresh_branch = self.session.split(
+                        self.session.default_branch
                     )
+                if self.verbose:
                     print(
-                        f"Started operation {node.id} on branch: {branch_name}"
+                        f"Operation {str(operation.id)[:8]} starting with fresh context"
                     )
+                return fresh_branch
+            except:
+                pass
-            # If we started new tasks or have executing tasks, wait for some to complete
-            if started_count > 0 or executing_tasks:
-                # Wait for at least one task to complete before next iteration
-                if executing_tasks:
-                    done, pending = await asyncio.wait(
-                        executing_tasks.values(),
-                        return_when=asyncio.FIRST_COMPLETED,
-                    )
-                else:
-                    await asyncio.sleep(0.01)
-            elif not remaining_nodes:
-                # All done
-                break
-        if iteration >= max_iterations:
-            raise RuntimeError(
-                f"Flow execution exceeded maximum iterations ({max_iterations})"
-            )
-    return {
-        "completed_operations": completed,
-        "operation_results": results,
-        "final_context": execution_context,
-    }
-async def _execute_node_async(
-    node: Operation,
-    branch: Branch,
-    graph: Graph,
-    results: dict[str, Any],
-    execution_context: dict[str, Any],
-    verbose: bool,
-) -> Any:
-    """Execute a single node asynchronously."""
-    # Update operation context with predecessors
-    predecessors = graph.get_predecessors(node)
-    if predecessors:
-        pred_context = {}
-        for pred in predecessors:
-            if pred.id in results:
-                result = results[pred.id]
-                # Use to_dict for proper serialization of complex types only
-                if result is not None and not isinstance(
-                    result, (str, int, float, bool)
-                ):
-                    result = to_dict(result, recursive=True)
-                pred_context[f"{pred.id}_result"] = result
-        if "context" not in node.parameters:
-            node.parameters["context"] = pred_context
-        else:
-            node.parameters["context"].update(pred_context)
-    # Add execution context
-    if execution_context:
-        if "context" not in node.parameters:
-            node.parameters["context"] = execution_context.copy()
-        else:
-            node.parameters["context"].update(execution_context)
-    # Execute the operation
-    await node.invoke(branch)
-    result = node.response
-    # Update execution context if needed
-    if isinstance(result, dict) and "context" in result:
-        execution_context.update(result["context"])
+        # Default to session's default branch or the provided branch
+        if hasattr(self, "_default_branch") and self._default_branch:
+            return self._default_branch
+        return self.session.default_branch
-    return result
+async def flow(
+    session: Session,
+    graph: Graph,
+    *,
+    branch: Branch | None = None,
+    context: dict[str, Any] | None = None,
+    parallel: bool = True,
+    max_concurrent: int = None,
+    verbose: bool = False,
+) -> dict[str, Any]:
+    """Execute a graph using structured concurrency primitives.
-def _topological_sort(graph: Graph) -> list[str]:
-    """Get topological ordering of graph nodes."""
-    visited = set()
-    stack = []
-    def visit(node_id: str):
-        if node_id in visited:
-            return
-        visited.add(node_id)
-        successors = graph.get_successors(graph.internal_nodes[node_id])
-        for successor in successors:
-            visit(successor.id)
-        stack.append(node_id)
+    This provides clean dependency management and context inheritance
+    using Events and CapacityLimiter for proper coordination.
-    for node in graph.internal_nodes:
-        if node.id not in visited:
-            visit(node.id)
+    Args:
+        session: Session for branch management and multi-branch execution
+        graph: The workflow graph containing Operation nodes
+        branch: Optional specific branch to use for single-branch operations
+        context: Initial context
+        parallel: Whether to execute independent operations in parallel
+        max_concurrent: Max concurrent operations (1 if not parallel)
+        verbose: Enable verbose logging
-    return stack[::-1]
+    Returns:
+        Execution results with completed operations and final context
+    """
+    # Handle concurrency limits
+    if not parallel:
+        max_concurrent = 1  # Force sequential execution
+    # If max_concurrent is None, it means no limit
+    # Execute using the dependency-aware executor
+    executor = DependencyAwareExecutor(
+        session=session,
+        graph=graph,
+        context=context,
+        max_concurrent=max_concurrent,
+        verbose=verbose,
+        default_branch=branch,
+    )
-async def _dependencies_satisfied_async(
-    node: Node,
-    graph: Graph,
-    completed: set[str],
-    results: dict[str, Any],
-    execution_context: dict[str, Any] | None = None,
-) -> bool:
-    """Check if node dependencies are satisfied and edge conditions pass."""
-    # Get all incoming edges to this node
-    incoming_edges: list[Edge] = []
-    for edge in graph.internal_edges:
-        if edge.tail == node.id:
-            incoming_edges.append(edge)
-    # If no incoming edges, node can execute
-    if not incoming_edges:
-        return True
-    # Check each incoming edge
-    at_least_one_satisfied = False
-    for edge in incoming_edges:
-        # Check if predecessor is completed
-        if edge.head not in completed:
-            continue
-        # Predecessor is completed
-        if edge.condition:
-            # Evaluate condition
-            # Get the result - don't use to_dict if it's already a simple type
-            result_value = results.get(edge.head)
-            if result_value is not None and not isinstance(
-                result_value, (str, int, float, bool)
-            ):
-                result_value = to_dict(result_value, recursive=True)
-            ctx = {"result": result_value, "context": execution_context or {}}
-            with contextlib.suppress(Exception):
-                if await edge.condition.apply(ctx):
-                    at_least_one_satisfied = True
-        else:
-            # No condition, edge is satisfied
-            at_least_one_satisfied = True
-    return at_least_one_satisfied
+    return await executor.execute()

lionagi-0.13.6-py3-none-any.whl → lionagi-0.14.0-py3-none-any.whl