PyPI - pyochain - Versions diffs - 0.5.1__py3-none-any.whl → 0.5.31__py3-none-any.whl - Mend

pyochain 0.5.1__py3-none-any.whl → 0.5.31__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of pyochain might be problematic. Click here for more details.

Files changed (35) hide show

pyochain/__init__.py +2 -2
pyochain/_core/__init__.py +3 -1
pyochain/_core/_format.py +34 -0
pyochain/_core/_main.py +65 -44
pyochain/_core/_protocols.py +2 -7
pyochain/_dict/__init__.py +1 -2
pyochain/_dict/_filters.py +17 -22
pyochain/_dict/_groups.py +7 -8
pyochain/_dict/_iter.py +52 -9
pyochain/_dict/_joins.py +11 -9
pyochain/_dict/_main.py +32 -226
pyochain/_dict/_maps.py +142 -0
pyochain/_dict/_nested.py +119 -65
pyochain/_dict/_process.py +40 -7
pyochain/_iter/_aggregations.py +1 -0
pyochain/_iter/_booleans.py +3 -0
pyochain/_iter/_dicts.py +243 -0
pyochain/_iter/_eager.py +60 -22
pyochain/_iter/_filters.py +31 -24
pyochain/_iter/_joins.py +13 -16
pyochain/_iter/_lists.py +11 -9
pyochain/_iter/_main.py +302 -60
pyochain/_iter/_maps.py +55 -39
pyochain/_iter/_partitions.py +11 -14
pyochain/_iter/_process.py +26 -44
pyochain/_iter/_rolling.py +22 -28
pyochain/_iter/_tuples.py +119 -14
{pyochain-0.5.1.dist-info → pyochain-0.5.31.dist-info}/METADATA +8 -42
pyochain-0.5.31.dist-info/RECORD +32 -0
pyochain/_dict/_exprs.py +0 -115
pyochain/_dict/_funcs.py +0 -62
pyochain/_iter/_constructors.py +0 -155
pyochain/_iter/_groups.py +0 -264
pyochain-0.5.1.dist-info/RECORD +0 -33
{pyochain-0.5.1.dist-info → pyochain-0.5.31.dist-info}/WHEEL +0 -0

pyochain/_dict/_process.py CHANGED Viewed

@@ -5,7 +5,7 @@ from typing import TYPE_CHECKING, Any, Concatenate
 import cytoolz as cz
-from .._core import MappingWrapper
+from .._core import MappingWrapper, SupportsRichComparison
 if TYPE_CHECKING:
     from ._main import Dict
@@ -44,7 +44,7 @@ class ProcessDict[K, V](MappingWrapper[K, V]):
                 func(k, v, *args, **kwargs)
             return data
-        return self.apply(_for_each)
+        return self._new(_for_each)
     def update_in(
         self, *keys: K, func: Callable[[V], V], default: V | None = None
@@ -80,7 +80,11 @@ class ProcessDict[K, V](MappingWrapper[K, V]):
         ```
         """
-        return self.apply(cz.dicttoolz.update_in, keys, func, default=default)
+        def _update_in(data: dict[K, V]) -> dict[K, V]:
+            return cz.dicttoolz.update_in(data, keys, func, default=default)
+        return self._new(_update_in)
     def with_key(self, key: K, value: V) -> Dict[K, V]:
         """
@@ -102,7 +106,11 @@ class ProcessDict[K, V](MappingWrapper[K, V]):
         ```
         """
-        return self.apply(cz.dicttoolz.assoc, key, value)
+        def _with_key(data: dict[K, V]) -> dict[K, V]:
+            return cz.dicttoolz.assoc(data, key, value)
+        return self._new(_with_key)
     def drop(self, *keys: K) -> Dict[K, V]:
         """
@@ -125,7 +133,11 @@ class ProcessDict[K, V](MappingWrapper[K, V]):
         ```
         """
-        return self.apply(cz.dicttoolz.dissoc, *keys)
+        def _drop(data: dict[K, V]) -> dict[K, V]:
+            return cz.dicttoolz.dissoc(data, *keys)
+        return self._new(_drop)
     def rename(self, mapping: Mapping[K, K]) -> Dict[K, V]:
         """
@@ -148,7 +160,7 @@ class ProcessDict[K, V](MappingWrapper[K, V]):
         def _rename(data: dict[K, V]) -> dict[K, V]:
             return {mapping.get(k, k): v for k, v in data.items()}
-        return self.apply(_rename)
+        return self._new(_rename)
     def sort(self, reverse: bool = False) -> Dict[K, V]:
         """
@@ -168,4 +180,25 @@ class ProcessDict[K, V](MappingWrapper[K, V]):
         def _sort(data: dict[K, V]) -> dict[K, V]:
             return dict(sorted(data.items(), reverse=reverse))
-        return self.apply(_sort)
+        return self._new(_sort)
+    def sort_values[U: SupportsRichComparison[Any]](
+        self: ProcessDict[K, U], reverse: bool = False
+    ) -> Dict[K, U]:
+        """
+        Sort the dictionary by its values and return a new Dict.
+        Args:
+            reverse: Whether to sort in descending order. Defaults to False.
+        ```python
+        >>> import pyochain as pc
+        >>> pc.Dict({"a": 2, "b": 1}).sort_values().unwrap()
+        {'b': 1, 'a': 2}
+        ```
+        """
+        def _sort_values(data: dict[K, U]) -> dict[K, U]:
+            return dict(sorted(data.items(), key=lambda item: item[1], reverse=reverse))
+        return self._new(_sort_values)

pyochain/_iter/_aggregations.py CHANGED Viewed

@@ -30,6 +30,7 @@ class BaseAgg[T](IterWrapper[T]):
         - one from the left elements of the pairs
         - one from the right elements.
         This function is, in some sense, the opposite of zip.
         ```python
         >>> import pyochain as pc

pyochain/_iter/_booleans.py CHANGED Viewed

@@ -21,6 +21,7 @@ class BaseBool[T](IterWrapper[T]):
         If any of them return false, it returns false.
         An empty iterator returns true.
         Args:
             predicate: Function to evaluate each item. Defaults to checking truthiness.
         Example:
@@ -57,6 +58,7 @@ class BaseBool[T](IterWrapper[T]):
         If they all return false, it returns false.
         An empty iterator returns false.
         Args:
             predicate: Function to evaluate each item. Defaults to checking truthiness.
         Example:
@@ -200,6 +202,7 @@ class BaseBool[T](IterWrapper[T]):
         - Returning the first element that satisfies the `predicate`.
         If all the elements return false, `Iter.find()` returns the default value.
         Args:
             default: Value to return if no element satisfies the predicate. Defaults to None.
             predicate: Function to evaluate each item. Defaults to checking truthiness.

pyochain/_iter/_dicts.py ADDED Viewed

@@ -0,0 +1,243 @@
+from __future__ import annotations
+from collections.abc import Callable, Iterable, Sequence
+from typing import TYPE_CHECKING, Any
+import cytoolz as cz
+from .._core import IterWrapper
+if TYPE_CHECKING:
+    from .._dict import Dict
+class BaseDict[T](IterWrapper[T]):
+    def with_keys[K](self, keys: Iterable[K]) -> Dict[K, T]:
+        """
+        Create a Dict by zipping the iterable with keys.
+        Args:
+            keys: Iterable of keys to pair with the values.
+        Example:
+        ```python
+        >>> import pyochain as pc
+        >>> keys = ["a", "b", "c"]
+        >>> values = [1, 2, 3]
+        >>> pc.Iter.from_(values).with_keys(keys).unwrap()
+        {'a': 1, 'b': 2, 'c': 3}
+        >>> # This is equivalent to:
+        >>> pc.Iter.from_(keys).zip(values).pipe(
+        ...     lambda x: pc.Dict(x.into(dict)).unwrap()
+        ... )
+        {'a': 1, 'b': 2, 'c': 3}
+        ```
+        """
+        from .._dict import Dict
+        def _with_keys(data: Iterable[T]) -> Dict[K, T]:
+            return Dict(dict(zip(keys, data)))
+        return self.into(_with_keys)
+    def with_values[V](self, values: Iterable[V]) -> Dict[T, V]:
+        """
+        Create a Dict by zipping the iterable with values.
+        Args:
+            values: Iterable of values to pair with the keys.
+        Example:
+        ```python
+        >>> import pyochain as pc
+        >>> keys = [1, 2, 3]
+        >>> values = ["a", "b", "c"]
+        >>> pc.Iter.from_(keys).with_values(values).unwrap()
+        {1: 'a', 2: 'b', 3: 'c'}
+        >>> # This is equivalent to:
+        >>> pc.Iter.from_(keys).zip(values).pipe(
+        ...     lambda x: pc.Dict(x.into(dict)).unwrap()
+        ... )
+        {1: 'a', 2: 'b', 3: 'c'}
+        ```
+        """
+        from .._dict import Dict
+        def _with_values(data: Iterable[T]) -> Dict[T, V]:
+            return Dict(dict(zip(data, values)))
+        return self.into(_with_values)
+    def reduce_by[K](
+        self, key: Callable[[T], K], binop: Callable[[T, T], T]
+    ) -> Dict[K, T]:
+        """
+        Perform a simultaneous groupby and reduction.
+        Args:
+            key: Function to compute the key for grouping.
+            binop: Binary operation to reduce the grouped elements.
+        Example:
+        ```python
+        >>> from collections.abc import Iterable
+        >>> import pyochain as pc
+        >>> from operator import add, mul
+        >>>
+        >>> def is_even(x: int) -> bool:
+        ...     return x % 2 == 0
+        >>>
+        >>> def group_reduce(data: Iterable[int]) -> int:
+        ...     return pc.Iter.from_(data).reduce(add)
+        >>>
+        >>> data = pc.Seq([1, 2, 3, 4, 5])
+        >>> data.iter().reduce_by(is_even, add).unwrap()
+        {False: 9, True: 6}
+        >>> data.iter().group_by(is_even).map_values(group_reduce).unwrap()
+        {False: 9, True: 6}
+        ```
+        But the former does not build the intermediate groups, allowing it to operate in much less space.
+        This makes it suitable for larger datasets that do not fit comfortably in memory
+        Simple Examples:
+        ```python
+        >>> pc.Iter.from_([1, 2, 3, 4, 5]).reduce_by(is_even, add).unwrap()
+        {False: 9, True: 6}
+        >>> pc.Iter.from_([1, 2, 3, 4, 5]).reduce_by(is_even, mul).unwrap()
+        {False: 15, True: 8}
+        ```
+        """
+        from .._dict import Dict
+        def _reduce_by(data: Iterable[T]) -> Dict[K, T]:
+            return Dict(cz.itertoolz.reduceby(key, binop, data))
+        return self.into(_reduce_by)
+    def group_by[K](self, on: Callable[[T], K]) -> Dict[K, list[T]]:
+        """
+        Group elements by key function and return a Dict result.
+        Args:
+            on: Function to compute the key for grouping.
+        Example:
+        ```python
+        >>> import pyochain as pc
+        >>> names = [
+        ...     "Alice",
+        ...     "Bob",
+        ...     "Charlie",
+        ...     "Dan",
+        ...     "Edith",
+        ...     "Frank",
+        ... ]
+        >>> pc.Iter.from_(names).group_by(len).sort()
+        ... # doctest: +NORMALIZE_WHITESPACE
+        {3: ['Bob', 'Dan'], 5: ['Alice', 'Edith', 'Frank'], 7: ['Charlie']}
+        >>>
+        >>> iseven = lambda x: x % 2 == 0
+        >>> pc.Iter.from_([1, 2, 3, 4, 5, 6, 7, 8]).group_by(iseven)
+        ... # doctest: +NORMALIZE_WHITESPACE
+        {False: [1, 3, 5, 7], True: [2, 4, 6, 8]}
+        ```
+        Non-callable keys imply grouping on a member.
+        ```python
+        >>> data = [
+        ...     {"name": "Alice", "gender": "F"},
+        ...     {"name": "Bob", "gender": "M"},
+        ...     {"name": "Charlie", "gender": "M"},
+        ... ]
+        >>> pc.Iter.from_(data).group_by("gender").sort()
+        ... # doctest: +NORMALIZE_WHITESPACE
+        {'F': [{'gender': 'F', 'name': 'Alice'}],
+        'M': [{'gender': 'M', 'name': 'Bob'}, {'gender': 'M', 'name': 'Charlie'}]}
+        ```
+        """
+        from .._dict import Dict
+        def _group_by(data: Iterable[T]) -> Dict[K, list[T]]:
+            return Dict(cz.itertoolz.groupby(on, data))
+        return self.into(_group_by)
+    def frequencies(self) -> Dict[T, int]:
+        """
+        Find number of occurrences of each value in the iterable.
+        ```python
+        >>> import pyochain as pc
+        >>> data = ["cat", "cat", "ox", "pig", "pig", "cat"]
+        >>> pc.Iter.from_(data).frequencies().unwrap()
+        {'cat': 3, 'ox': 1, 'pig': 2}
+        ```
+        """
+        from .._dict import Dict
+        def _frequencies(data: Iterable[T]) -> Dict[T, int]:
+            return Dict(cz.itertoolz.frequencies(data))
+        return self.into(_frequencies)
+    def count_by[K](self, key: Callable[[T], K]) -> Dict[K, int]:
+        """
+        Count elements of a collection by a key function.
+        Args:
+            key: Function to compute the key for counting.
+        Example:
+        ```python
+        >>> import pyochain as pc
+        >>> pc.Iter.from_(["cat", "mouse", "dog"]).count_by(len).unwrap()
+        {3: 2, 5: 1}
+        >>> def iseven(x):
+        ...     return x % 2 == 0
+        >>> pc.Iter.from_([1, 2, 3]).count_by(iseven).unwrap()
+        {False: 2, True: 1}
+        ```
+        """
+        from .._dict import Dict
+        def _count_by(data: Iterable[T]) -> Dict[K, int]:
+            return Dict(cz.recipes.countby(key, data))
+        return self.into(_count_by)
+    def to_records[U: Sequence[Any]](self: BaseDict[U]) -> Dict[Any, Any]:
+        """
+        Transform an iterable of nested sequences into a nested dictionary.
+        - Each inner sequence represents a path to a value in the dictionary.
+        - The last element of each sequence is treated as the value
+        - All preceding elements are treated as keys leading to that value.
+        Example:
+        ```python
+        >>> import pyochain as pc
+        >>> arrays = [["a", "b", 1], ["a", "c", 2], ["d", 3]]
+        >>> pc.Seq(arrays).to_records().unwrap()
+        {'a': {'b': 1, 'c': 2}, 'd': 3}
+        ```
+        """
+        from .._dict import Dict
+        def _from_nested(
+            arrays: Iterable[Sequence[Any]], parent: dict[Any, Any] | None = None
+        ) -> dict[Any, Any]:
+            """from dictutils.pivot"""
+            d: dict[Any, Any] = parent or {}
+            for arr in arrays:
+                if len(arr) >= 2:
+                    head, *tail = arr
+                    if len(tail) == 1:
+                        d[head] = tail[0]
+                    else:
+                        d[head] = _from_nested([tail], d.get(head, {}))
+            return d
+        return Dict(self.into(_from_nested))

pyochain/_iter/_eager.py CHANGED Viewed

@@ -1,6 +1,6 @@
 from __future__ import annotations
-from collections.abc import Callable, Iterable
+from collections.abc import Callable, Iterable, Sequence
 from functools import partial
 from typing import TYPE_CHECKING, Any
@@ -38,7 +38,7 @@ class BaseEager[T](IterWrapper[T]):
         def _sort(data: Iterable[U]) -> list[U]:
             return sorted(data, reverse=reverse, key=key)
-        return self.collect(_sort)
+        return self._eager(_sort)
     def tail(self, n: int) -> Seq[T]:
         """
@@ -54,7 +54,7 @@ class BaseEager[T](IterWrapper[T]):
         ```
         """
-        return self.collect(partial(cz.itertoolz.tail, n))
+        return self._eager(partial(cz.itertoolz.tail, n))
     def top_n(self, n: int, key: Callable[[T], Any] | None = None) -> Seq[T]:
         """
@@ -71,7 +71,7 @@ class BaseEager[T](IterWrapper[T]):
         ```
         """
-        return self.collect(partial(cz.itertoolz.topk, n, key=key))
+        return self._eager(partial(cz.itertoolz.topk, n, key=key))
     def union(self, *others: Iterable[T]) -> Seq[T]:
         """
@@ -91,10 +91,10 @@ class BaseEager[T](IterWrapper[T]):
         ```
         """
-        def _union(data: Iterable[T]) -> set[T]:
-            return set(data).union(*others)
+        def _union(data: Iterable[T]) -> list[T]:
+            return list(set(data).union(*others))
-        return self.collect(_union)
+        return self._eager(_union)
     def intersection(self, *others: Iterable[T]) -> Seq[T]:
         """
@@ -109,15 +109,15 @@ class BaseEager[T](IterWrapper[T]):
         ```python
         >>> import pyochain as pc
         >>> pc.Iter.from_([1, 2, 2]).intersection([2, 3], [2]).unwrap()
-        {2}
+        [2]
         ```
         """
-        def _intersection(data: Iterable[T]) -> set[T]:
-            return set(data).intersection(*others)
+        def _intersection(data: Iterable[T]) -> list[T]:
+            return list(set(data).intersection(*others))
-        return self.collect(_intersection)
+        return self._eager(_intersection)
     def diff_unique(self, *others: Iterable[T]) -> Seq[T]:
         """
@@ -133,15 +133,15 @@ class BaseEager[T](IterWrapper[T]):
         ```python
         >>> import pyochain as pc
         >>> pc.Iter.from_([1, 2, 2]).diff_unique([2, 3]).unwrap()
-        {1}
+        [1]
         ```
         """
-        def _difference(data: Iterable[T]) -> set[T]:
-            return set(data).difference(*others)
+        def _difference(data: Iterable[T]) -> list[T]:
+            return list(set(data).difference(*others))
-        return self.collect(_difference)
+        return self._eager(_difference)
     def diff_symmetric(self, *others: Iterable[T]) -> Seq[T]:
         """
@@ -163,10 +163,10 @@ class BaseEager[T](IterWrapper[T]):
         ```
         """
-        def _symmetric_difference(data: Iterable[T]) -> set[T]:
-            return set(data).symmetric_difference(*others)
+        def _symmetric_difference(data: Iterable[T]) -> list[T]:
+            return list(set(data).symmetric_difference(*others))
-        return self.collect(_symmetric_difference)
+        return self._eager(_symmetric_difference)
     def most_common(self, n: int | None = None) -> Seq[tuple[T, int]]:
         """
@@ -176,7 +176,6 @@ class BaseEager[T](IterWrapper[T]):
         Args:
             n: Number of most common elements to return. Defaults to None (all elements).
         Example:
         ```python
         >>> import pyochain as pc
@@ -187,9 +186,48 @@ class BaseEager[T](IterWrapper[T]):
         """
         from collections import Counter
-        from ._main import Seq
         def _most_common(data: Iterable[T]) -> list[tuple[T, int]]:
             return Counter(data).most_common(n)
-        return Seq(self.into(_most_common))
+        return self._eager(_most_common)
+    def rearrange[U: Sequence[Any]](self: BaseEager[U], *indices: int) -> Seq[list[U]]:
+        """
+        Rearrange elements in a given list of arrays by order indices.
+        The last element (value) always remains in place.
+        Args:
+            order: List of indices specifying new order of keys
+        Raises:
+            IndexError: If any index in order is out of range for the row
+        Example:
+        ```python
+        >>> import pyochain as pc
+        >>> data = pc.Seq([["A", "X", 1], ["A", "Y", 2], ["B", "X", 3], ["B", "Y", 4]])
+        >>> data.rearrange(1, 0).unwrap()
+        [['X', 'A', 1], ['Y', 'A', 2], ['X', 'B', 3], ['Y', 'B', 4]]
+        ```
+        """
+        def _rearrange(in_arrs: Iterable[U]) -> list[list[U]]:
+            """from dictutils.pivot"""
+            order = indices
+            out: list[list[U]] = []
+            for arr in in_arrs:
+                max_key_index: int = len(arr) - 2
+                for i in order:
+                    if i < 0 or i > max_key_index:
+                        raise IndexError(
+                            f"order index {i} out of range for row with {max_key_index + 1} keys"
+                        )
+                out.append([arr[i] for i in order] + [arr[-1]])
+            return out
+        return self._eager(_rearrange)

pyochain 0.5.1__py3-none-any.whl → 0.5.31__py3-none-any.whl

Potentially problematic release.

pyochain 0.5.1__py3-none-any.whl → 0.5.31__py3-none-any.whl