PyPI - lionagi - Versions diffs - 0.15.14__py3-none-any.whl → 0.16.0__py3-none-any.whl - Mend

lionagi 0.15.14__py3-none-any.whl → 0.16.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (39) hide show

lionagi/libs/validate/fuzzy_match_keys.py +5 -182
lionagi/libs/validate/string_similarity.py +6 -331
lionagi/ln/__init__.py +56 -66
lionagi/ln/_async_call.py +13 -10
lionagi/ln/_hash.py +33 -8
lionagi/ln/_list_call.py +2 -35
lionagi/ln/_to_list.py +51 -28
lionagi/ln/_utils.py +156 -0
lionagi/ln/concurrency/__init__.py +39 -31
lionagi/ln/concurrency/_compat.py +65 -0
lionagi/ln/concurrency/cancel.py +92 -109
lionagi/ln/concurrency/errors.py +17 -17
lionagi/ln/concurrency/patterns.py +249 -206
lionagi/ln/concurrency/primitives.py +257 -216
lionagi/ln/concurrency/resource_tracker.py +42 -155
lionagi/ln/concurrency/task.py +55 -73
lionagi/ln/concurrency/throttle.py +3 -0
lionagi/ln/concurrency/utils.py +1 -0
lionagi/ln/fuzzy/__init__.py +15 -0
lionagi/ln/{_extract_json.py → fuzzy/_extract_json.py} +22 -9
lionagi/ln/{_fuzzy_json.py → fuzzy/_fuzzy_json.py} +14 -8
lionagi/ln/fuzzy/_fuzzy_match.py +172 -0
lionagi/ln/fuzzy/_fuzzy_validate.py +46 -0
lionagi/ln/fuzzy/_string_similarity.py +332 -0
lionagi/ln/{_models.py → types.py} +153 -4
lionagi/operations/flow.py +2 -1
lionagi/operations/operate/operate.py +26 -16
lionagi/protocols/contracts.py +46 -0
lionagi/protocols/generic/event.py +6 -6
lionagi/protocols/generic/processor.py +9 -5
lionagi/protocols/ids.py +82 -0
lionagi/protocols/types.py +10 -12
lionagi/utils.py +34 -64
lionagi/version.py +1 -1
{lionagi-0.15.14.dist-info → lionagi-0.16.0.dist-info}/METADATA +4 -2
{lionagi-0.15.14.dist-info → lionagi-0.16.0.dist-info}/RECORD +38 -31
lionagi/ln/_types.py +0 -146
{lionagi-0.15.14.dist-info → lionagi-0.16.0.dist-info}/WHEEL +0 -0
{lionagi-0.15.14.dist-info → lionagi-0.16.0.dist-info}/licenses/LICENSE +0 -0

lionagi/ln/concurrency/patterns.py CHANGED Viewed

@@ -1,259 +1,302 @@
-"""Common concurrency patterns for structured concurrency."""
+"""Lion Async Concurrency Patterns - Structured concurrency coordination utilities.
+This module provides async coordination patterns built on AnyIO's structured
+concurrency primitives. All patterns are backend-neutral (asyncio/trio).
+Key Features:
+- gather: Concurrent execution with fail-fast or exception collection
+- race: First-to-complete coordination
+- bounded_map: Concurrent mapping with rate limiting
+- CompletionStream: Stream results as they become available
+- retry: Deadline-aware exponential backoff
+Note on Structural Concurrency:
+These patterns follow structured concurrency principles where possible. In
+particular, CompletionStream provides an explicit lifecycle to avoid the
+pitfalls of unstructured as_completed-like patterns when breaking early.
+See individual function docstrings for details.
+"""
 from __future__ import annotations
-import logging
-from collections.abc import Awaitable, Callable
-from types import TracebackType
-from typing import Any, TypeVar
+from collections.abc import Awaitable, Callable, Iterable, Sequence
+from typing import TypeVar
 import anyio
-from .cancel import move_on_after
-from .primitives import CapacityLimiter, Lock
-from .resource_tracker import track_resource, untrack_resource
+from ._compat import ExceptionGroup
+from .cancel import effective_deadline
+from .errors import is_cancelled
+from .primitives import CapacityLimiter
 from .task import create_task_group
-logger = logging.getLogger(__name__)
 T = TypeVar("T")
 R = TypeVar("R")
-Response = TypeVar("Response")
-class ConnectionPool:
-    """A pool of reusable connections."""
+__all__ = (
+    "gather",
+    "race",
+    "bounded_map",
+    "CompletionStream",
+    "retry",
+)
-    def __init__(
-        self,
-        max_connections: int,
-        connection_factory: Callable[[], Awaitable[T]],
-    ):
-        """Initialize a new connection pool."""
-        if max_connections < 1:
-            raise ValueError("max_connections must be >= 1")
-        if not callable(connection_factory):
-            raise ValueError("connection_factory must be callable")
-        self._connection_factory = connection_factory
-        self._limiter = CapacityLimiter(max_connections)
-        self._connections: list[T] = []
-        self._lock = Lock()
+async def gather(
+    *aws: Awaitable[T], return_exceptions: bool = False
+) -> list[T | BaseException]:
+    """Run awaitables concurrently, return list of results.
-        track_resource(self, f"ConnectionPool-{id(self)}", "ConnectionPool")
+    Args:
+        *aws: Awaitables to execute concurrently
+        return_exceptions: If True, exceptions are returned as results
+                           If False, first exception cancels all tasks and re-raises
-    def __del__(self):
-        """Clean up resource tracking."""
-        try:
-            untrack_resource(self)
-        except Exception:
-            pass
+    Returns:
+        List of results in same order as input awaitables
+    """
+    if not aws:
+        return []
-    async def acquire(self) -> T:
-        """Acquire a connection from the pool."""
-        await self._limiter.acquire()
+    results: list[T | BaseException | None] = [None] * len(aws)
+    async def _runner(idx: int, aw: Awaitable[T]) -> None:
         try:
-            async with self._lock:
-                if self._connections:
-                    return self._connections.pop()
-            # No pooled connection available, create new one
-            return await self._connection_factory()
-        except Exception:
-            self._limiter.release()
-            raise
+            results[idx] = await aw
+        except BaseException as exc:
+            results[idx] = exc
+            if not return_exceptions:
+                raise  # Propagate to the TaskGroup
-    async def release(self, connection: T) -> None:
-        """Release a connection back to the pool."""
-        try:
-            async with self._lock:
-                self._connections.append(connection)
-        finally:
-            self._limiter.release()
+    try:
+        async with create_task_group() as tg:
+            for i, aw in enumerate(aws):
+                tg.start_soon(_runner, i, aw)
+    except ExceptionGroup as eg:
+        if not return_exceptions:
+            # Find the first "real" exception and raise it.
+            non_cancel_excs = [e for e in eg.exceptions if not is_cancelled(e)]
+            if non_cancel_excs:
+                raise non_cancel_excs[0]
+            raise  # Re-raise group if all were cancellations
-    async def __aenter__(self) -> ConnectionPool[T]:
-        """Enter the connection pool context."""
-        return self
+    return results  # type: ignore
+async def race(*aws: Awaitable[T]) -> T:
+    """Run awaitables concurrently, return result of first completion.
-    async def __aexit__(
-        self,
-        exc_type: type[BaseException] | None,
-        exc_val: BaseException | None,
-        exc_tb: TracebackType | None,
-    ) -> None:
-        """Exit the connection pool context."""
-        # Clean up any remaining connections
-        async with self._lock:
-            self._connections.clear()
-async def parallel_requests(
-    inputs: list[str],
-    func: Callable[[str], Awaitable[Response]],
-    max_concurrency: int = 10,
-) -> list[Response]:
-    """Execute requests in parallel with controlled concurrency.
+    Returns the first result to complete, whether success or failure.
+    All other tasks are cancelled when first task completes.
+    If first completion is an exception, it's re-raised.
+    Note: This returns first *completion*, not first *success*.
+    For first-success semantics, consider implementing a first_success variant.
+    """
+    if not aws:
+        raise ValueError("race() requires at least one awaitable")
+    send, recv = anyio.create_memory_object_stream(0)
+    async def _runner(aw: Awaitable[T]) -> None:
+        try:
+            res = await aw
+            await send.send((True, res))
+        except BaseException as exc:
+            await send.send((False, exc))
+    async with send, recv, create_task_group() as tg:
+        for aw in aws:
+            tg.start_soon(_runner, aw)
+        ok, payload = await recv.receive()
+        tg.cancel_scope.cancel()
+    # Raise outside the TaskGroup context to avoid ExceptionGroup wrapping
+    if ok:
+        return payload  # type: ignore[return-value]
+    raise payload  # type: ignore[misc]
+async def bounded_map(
+    func: Callable[[T], Awaitable[R]],
+    items: Iterable[T],
+    *,
+    limit: int,
+    return_exceptions: bool = False,
+) -> list[R | BaseException]:
+    """Apply async function to items with concurrency limit.
     Args:
-        inputs: List of inputs
-        fetch_func: Async function
-        max_concurrency: Maximum number of concurrent requests
+        func: Async function to apply to each item
+        items: Items to process
+        limit: Maximum concurrent operations
+        return_exceptions: If True, exceptions are returned as results.
+                           If False, first exception cancels all tasks and re-raises.
     Returns:
-        List of responses in the same order as inputs
+        List of results in same order as input items.
+        If return_exceptions is True, exceptions are included in results.
     """
-    if not inputs:
+    if limit <= 0:
+        raise ValueError("limit must be >= 1")
+    seq = list(items)
+    if not seq:
         return []
-    results: list[Response | None] = [None] * len(inputs)
+    out: list[R | BaseException | None] = [None] * len(seq)
+    limiter = CapacityLimiter(limit)
-    async def bounded_fetch(
-        semaphore: anyio.Semaphore, idx: int, url: str
-    ) -> None:
-        async with semaphore:
-            results[idx] = await func(url)
+    async def _runner(i: int, x: T) -> None:
+        async with limiter:
+            try:
+                out[i] = await func(x)
+            except BaseException as exc:
+                out[i] = exc
+                if not return_exceptions:
+                    raise  # Propagate to the TaskGroup
     try:
         async with create_task_group() as tg:
-            semaphore = anyio.Semaphore(max_concurrency)
-            for i, inp in enumerate(inputs):
-                await tg.start_soon(bounded_fetch, semaphore, i, inp)
-    except BaseException as e:
-        # Re-raise the first exception directly instead of ExceptionGroup
-        if hasattr(e, "exceptions") and e.exceptions:
-            raise e.exceptions[0]
-        else:
+            for i, x in enumerate(seq):
+                tg.start_soon(_runner, i, x)
+    except ExceptionGroup as eg:
+        if not return_exceptions:
+            non_cancel_excs = [e for e in eg.exceptions if not is_cancelled(e)]
+            if non_cancel_excs:
+                raise non_cancel_excs[0]
             raise
-    return results  # type: ignore
+    return out  # type: ignore
-async def retry_with_timeout(
-    func: Callable[[], Awaitable[T]],
-    max_retries: int = 3,
-    timeout: float = 30.0,
-    backoff_factor: float = 1.0,
-) -> T:
-    """Retry an async function with exponential backoff and timeout.
-    Args:
-        func: The async function to retry
-        max_retries: Maximum number of retries
-        timeout: Timeout for each attempt
-        backoff_factor: Multiplier for exponential backoff
+class CompletionStream:
+    """Structured-concurrency-safe completion stream with explicit lifecycle management.
-    Returns:
-        The result of the successful function call
+    This provides a safer alternative to as_completed() that allows explicit cancellation
+    of remaining tasks when early termination is needed.
-    Raises:
-        Exception: The last exception raised by the function
+    Usage:
+        async with CompletionStream(awaitables, limit=10) as stream:
+            async for index, result in stream:
+                if some_condition:
+                    break  # Remaining tasks are automatically cancelled
     """
-    last_exception = None
-    for attempt in range(max_retries):
-        try:
-            with move_on_after(timeout) as cancel_scope:
-                result = await func()
-                if not cancel_scope.cancelled_caught:
-                    return result
-                else:
-                    raise TimeoutError(f"Function timed out after {timeout}s")
-        except Exception as e:
-            last_exception = e
-            if attempt < max_retries - 1:
-                delay = backoff_factor * (2**attempt)
-                await anyio.sleep(delay)
-            continue
-    if last_exception:
-        raise last_exception
-    else:
-        raise RuntimeError("Retry failed without capturing exception")
-class WorkerPool:
-    """A pool of worker tasks that process items from a queue."""
     def __init__(
-        self, num_workers: int, worker_func: Callable[[Any], Awaitable[None]]
+        self, aws: Sequence[Awaitable[T]], *, limit: int | None = None
     ):
-        """Initialize a new worker pool."""
-        if num_workers < 1:
-            raise ValueError("num_workers must be >= 1")
-        if not callable(worker_func):
-            raise ValueError("worker_func must be callable")
-        self._num_workers = num_workers
-        self._worker_func = worker_func
-        self._queue = anyio.create_memory_object_stream(1000)
+        self.aws = aws
+        self.limit = limit
         self._task_group = None
+        self._send = None
+        self._recv = None
+        self._completed_count = 0
+        self._total_count = len(aws)
+    async def __aenter__(self):
+        n = len(self.aws)
+        self._send, self._recv = anyio.create_memory_object_stream(n)
+        self._task_group = anyio.create_task_group()
+        await self._task_group.__aenter__()
-        track_resource(self, f"WorkerPool-{id(self)}", "WorkerPool")
-    def __del__(self):
-        """Clean up resource tracking."""
-        try:
-            untrack_resource(self)
-        except Exception:
-            pass
+        limiter = CapacityLimiter(self.limit) if self.limit else None
-    async def start(self) -> None:
-        """Start the worker pool."""
-        if self._task_group is not None:
-            raise RuntimeError("Worker pool is already started")
+        async def _runner(i: int, aw: Awaitable[T]) -> None:
+            if limiter:
+                await limiter.acquire()
+            try:
+                res = await aw
+                await self._send.send((i, res))
+            finally:
+                if limiter:
+                    limiter.release()
-        self._task_group = create_task_group()
-        await self._task_group.__aenter__()
+        # Start all tasks
+        for i, aw in enumerate(self.aws):
+            self._task_group.start_soon(_runner, i, aw)
-        # Start worker tasks
-        for i in range(self._num_workers):
-            await self._task_group.start_soon(self._worker_loop)
+        return self
-    async def stop(self) -> None:
-        """Stop the worker pool."""
-        if self._task_group is None:
-            return
+    async def __aexit__(self, exc_type, exc_val, exc_tb):
+        # Cancel remaining tasks and clean up
+        if self._task_group:
+            await self._task_group.__aexit__(exc_type, exc_val, exc_tb)
+        if self._send:
+            await self._send.aclose()
+        if self._recv:
+            await self._recv.aclose()
+        return False
+    def __aiter__(self):
+        if not self._recv:
+            raise RuntimeError(
+                "CompletionStream must be used as async context manager"
+            )
+        return self
-        # Close the queue to signal workers to stop
-        await self._queue[0].aclose()
+    async def __anext__(self):
+        if self._completed_count >= self._total_count:
+            raise StopAsyncIteration
-        # Wait for all workers to finish
-        try:
-            await self._task_group.__aexit__(None, None, None)
-        finally:
-            self._task_group = None
-    async def submit(self, item: Any) -> None:
-        """Submit an item for processing."""
-        if self._task_group is None:
-            raise RuntimeError("Worker pool is not started")
-        await self._queue[0].send(item)
-    async def _worker_loop(self) -> None:
-        """Main loop for worker tasks."""
         try:
-            async with self._queue[1]:
-                async for item in self._queue[1]:
-                    try:
-                        await self._worker_func(item)
-                    except Exception as e:
-                        logger.error(f"Worker error processing item: {e}")
-        except anyio.ClosedResourceError:
-            # Queue was closed, worker should exit gracefully
-            pass
-    async def __aenter__(self) -> WorkerPool:
-        """Enter the worker pool context."""
-        await self.start()
-        return self
+            result = await self._recv.receive()
+            self._completed_count += 1
+            return result
+        except anyio.EndOfStream:
+            raise StopAsyncIteration
+async def retry(
+    fn: Callable[[], Awaitable[T]],
+    *,
+    attempts: int = 3,
+    base_delay: float = 0.1,
+    max_delay: float = 2.0,
+    retry_on: tuple[type[BaseException], ...] = (Exception,),
+    jitter: float = 0.1,
+) -> T:
+    """Deadline-aware exponential backoff retry.
+    If an ambient effective deadline exists, cap each sleep so the retry loop
+    never outlives its parent scope.
+    Args:
+        fn: Async function to retry (takes no args)
+        attempts: Maximum retry attempts
+        base_delay: Initial delay between retries
+        max_delay: Maximum delay between retries
+        retry_on: Exception types that trigger retry
+        jitter: Random jitter added to delay (0.0 to 1.0)
+    Returns:
+        Result of successful function call
-    async def __aexit__(
-        self,
-        exc_type: type[BaseException] | None,
-        exc_val: BaseException | None,
-        exc_tb: TracebackType | None,
-    ) -> None:
-        """Exit the worker pool context."""
-        await self.stop()
+    Raises:
+        Last exception if all attempts fail
+    """
+    attempt = 0
+    deadline = effective_deadline()
+    while True:
+        try:
+            return await fn()
+        except retry_on as exc:
+            attempt += 1
+            if attempt >= attempts:
+                raise
+            delay = min(max_delay, base_delay * (2 ** (attempt - 1)))
+            if jitter:
+                import random
+                delay *= 1 + random.random() * jitter
+            # Cap by ambient deadline if one exists
+            if deadline is not None:
+                remaining = deadline - anyio.current_time()
+                if remaining <= 0:
+                    # Out of time; surface the last error
+                    raise
+                delay = min(delay, remaining)
+            await anyio.sleep(delay)

lionagi 0.15.14__py3-none-any.whl → 0.16.0__py3-none-any.whl

lionagi 0.15.14__py3-none-any.whl → 0.16.0__py3-none-any.whl