PyPI - shrinkray - Versions diffs - 0.0.0__py3-none-any.whl → 25.12.26.0__py3-none-any.whl - Mend

shrinkray 0.0.0__py3-none-any.whl → 25.12.26.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (33) hide show

shrinkray/__main__.py +130 -960
shrinkray/cli.py +70 -0
shrinkray/display.py +75 -0
shrinkray/formatting.py +108 -0
shrinkray/passes/bytes.py +217 -10
shrinkray/passes/clangdelta.py +47 -17
shrinkray/passes/definitions.py +84 -4
shrinkray/passes/genericlanguages.py +61 -7
shrinkray/passes/json.py +6 -0
shrinkray/passes/patching.py +65 -57
shrinkray/passes/python.py +66 -23
shrinkray/passes/sat.py +505 -91
shrinkray/passes/sequences.py +26 -6
shrinkray/problem.py +206 -27
shrinkray/process.py +49 -0
shrinkray/reducer.py +187 -25
shrinkray/state.py +599 -0
shrinkray/subprocess/__init__.py +24 -0
shrinkray/subprocess/client.py +253 -0
shrinkray/subprocess/protocol.py +190 -0
shrinkray/subprocess/worker.py +491 -0
shrinkray/tui.py +915 -0
shrinkray/ui.py +72 -0
shrinkray/work.py +34 -6
{shrinkray-0.0.0.dist-info → shrinkray-25.12.26.0.dist-info}/METADATA +44 -27
shrinkray-25.12.26.0.dist-info/RECORD +33 -0
{shrinkray-0.0.0.dist-info → shrinkray-25.12.26.0.dist-info}/WHEEL +2 -1
shrinkray-25.12.26.0.dist-info/entry_points.txt +3 -0
shrinkray-25.12.26.0.dist-info/top_level.txt +1 -0
shrinkray/learning.py +0 -221
shrinkray-0.0.0.dist-info/RECORD +0 -22
shrinkray-0.0.0.dist-info/entry_points.txt +0 -3
{shrinkray-0.0.0.dist-info → shrinkray-25.12.26.0.dist-info/licenses}/LICENSE +0 -0

shrinkray/passes/sequences.py CHANGED Viewed

@@ -1,14 +1,18 @@
 from collections import defaultdict
-from typing import Any, Sequence, TypeVar
+from collections.abc import Sequence
+from typing import Any
 from shrinkray.passes.definitions import ReductionPass
 from shrinkray.passes.patching import CutPatch, Cuts, apply_patches
 from shrinkray.problem import ReductionProblem
-Seq = TypeVar("Seq", bound=Sequence[Any])
+async def delete_elements[Seq: Sequence[Any]](problem: ReductionProblem[Seq]) -> None:
+    """Try to delete individual elements from the sequence.
-async def delete_elements(problem: ReductionProblem[Seq]) -> None:
+    Creates a patch for each element and uses the patch applier to find
+    which elements can be removed while maintaining interestingness.
+    """
     await apply_patches(
         problem, Cuts(), [[(i, i + 1)] for i in range(len(problem.current_test_case))]
     )
@@ -24,7 +28,9 @@ def merged_intervals(intervals: list[tuple[int, int]]) -> list[tuple[int, int]]:
     return list(map(tuple, normalized))  # type: ignore
-def with_deletions(target: Seq, deletions: list[tuple[int, int]]) -> Seq:
+def with_deletions[Seq: Sequence[Any]](
+    target: Seq, deletions: list[tuple[int, int]]
+) -> Seq:
     result: list[Any] = []
     prev = 0
     total_deleted = 0
@@ -37,7 +43,15 @@ def with_deletions(target: Seq, deletions: list[tuple[int, int]]) -> Seq:
     return type(target)(result)  # type: ignore
-def block_deletion(min_block: int, max_block: int) -> ReductionPass[Seq]:
+def block_deletion[Seq: Sequence[Any]](
+    min_block: int, max_block: int
+) -> ReductionPass[Seq]:
+    """Create a pass that deletes contiguous blocks of elements.
+    Tries to remove blocks of size min_block to max_block, starting at
+    various offsets. Useful for removing larger chunks efficiently.
+    """
     async def apply(problem: ReductionProblem[Seq]) -> None:
         n = len(problem.current_test_case)
         if n <= min_block:
@@ -55,7 +69,13 @@ def block_deletion(min_block: int, max_block: int) -> ReductionPass[Seq]:
     return apply
-async def delete_duplicates(problem: ReductionProblem[Seq]) -> None:
+async def delete_duplicates[Seq: Sequence[Any]](problem: ReductionProblem[Seq]) -> None:
+    """Try to delete duplicate elements from the sequence.
+    Groups elements by value and tries to remove all occurrences of each
+    duplicated element together. Effective when the test case contains
+    repeated patterns that can be eliminated.
+    """
     index: dict[int, list[int]] = defaultdict(list)
     for i, c in enumerate(problem.current_test_case):

shrinkray/problem.py CHANGED Viewed

@@ -1,8 +1,28 @@
+"""Core abstractions for test-case reduction.
+This module defines the fundamental interfaces for reduction problems:
+- ReductionProblem[T]: The central abstraction representing a reduction task
+- BasicReductionProblem[T]: A concrete implementation with caching and callbacks
+- View[S, T]: A problem wrapper that parses through a Format
+The key insight is that all reduction is about finding the smallest test case
+that satisfies an "interestingness" predicate. The problem abstraction hides
+the details of caching, parallelism, and state management.
+"""
 import hashlib
 import time
-from abc import ABC, abstractmethod, abstractproperty
+from abc import ABC, abstractmethod
+from collections.abc import Awaitable, Callable, Sized
 from datetime import timedelta
-from typing import Any, Awaitable, Callable, Generic, Optional, TypeVar, cast
+from typing import (
+    TYPE_CHECKING,
+    Any,
+    Protocol,
+    TypeVar,
+    cast,
+)
 import attrs
 import trio
@@ -11,16 +31,48 @@ from humanize import naturalsize, precisedelta
 from shrinkray.work import WorkContext
+if TYPE_CHECKING:
+    from shrinkray.passes.definitions import Format
 S = TypeVar("S")
 T = TypeVar("T")
-def shortlex(value: Any) -> Any:
+class PassStatsProtocol(Protocol):
+    """Protocol for pass statistics tracking.
+    This allows problem.py to track stats without importing from reducer.py,
+    avoiding circular dependencies.
+    """
+    test_evaluations: int
+    successful_reductions: int
+    bytes_deleted: int
+def shortlex[SizedT: Sized](value: SizedT) -> tuple[int, SizedT]:
+    """Return a comparison key for shortlex ordering.
+    Shortlex ordering compares first by length, then lexicographically.
+    This ensures shorter test cases are always preferred, and among
+    equal-length test cases, lexicographically smaller ones win.
+    This ordering is crucial for reproducibility: regardless of which
+    reduction path is taken, the final result should be the same minimal
+    test case.
+    Example:
+        >>> shortlex(b"aa") < shortlex(b"aaa")  # shorter wins
+        True
+        >>> shortlex(b"ab") < shortlex(b"ba")   # same length, lex order
+        True
+    """
     return (len(value), value)
 def default_sort_key(value: Any):
-    if isinstance(value, (str, bytes)):
+    if isinstance(value, str | bytes):
         return shortlex(value)
     else:
         return shortlex(repr(value))
@@ -99,15 +151,57 @@ class ReductionStats:
 @define(slots=False)
-class ReductionProblem(Generic[T], ABC):
+class ReductionProblem[T](ABC):
+    """Abstract base class representing a test-case reduction task.
+    A ReductionProblem encapsulates everything needed to reduce a test case:
+    - The current best-known interesting test case
+    - A predicate to test if candidates are "interesting" (trigger the bug)
+    - An ordering to determine which test cases are "smaller"
+    Reduction passes work by generating candidate test cases and calling
+    is_interesting() on them. When a smaller interesting test case is found,
+    current_test_case is automatically updated.
+    The problem maintains a cache of interestingness results and tracks
+    statistics about the reduction process.
+    Subclasses must implement:
+    - current_test_case: Property returning the current best test case
+    - is_interesting(test_case): Async method testing if a candidate works
+    - sort_key(test_case): Returns a comparable key for ordering
+    - size(test_case): Returns the size of a test case
+    - display(value): Returns a human-readable representation
+    """
     work: WorkContext
+    # Track current pass stats for real-time updates (set by reducer)
+    current_pass_stats: PassStatsProtocol | None = None
     def __attrs_post_init__(self) -> None:
+        # Cache of View objects for each Format, to avoid re-parsing
         self.__view_cache: dict[Any, ReductionProblem[Any]] = {}
     def view(
         self, format: "Format[T, S] | type[Format[T, S]]"
     ) -> "ReductionProblem[S]":
+        """Create a view of this problem through a Format.
+        A View wraps this problem, parsing the current test case through
+        the format's parse() method and serializing candidates back through
+        dumps(). This allows format-specific passes to work on structured
+        data while the underlying problem operates on bytes.
+        Example:
+            # Work on lines instead of raw bytes
+            line_problem = byte_problem.view(Split(b"\\n"))
+            # Work on JSON structure
+            json_problem = byte_problem.view(JSON)
+        Views are cached: calling view() with the same format returns the
+        same View object, avoiding redundant parsing.
+        """
         try:
             return cast(ReductionProblem[S], self.__view_cache[format])
         except KeyError:
@@ -124,17 +218,32 @@ class ReductionProblem(Generic[T], ABC):
         return cast(ReductionProblem[S], self.__view_cache.setdefault(format, result))
-    async def setup(self) -> None:
-        pass
+    async def setup(self) -> None:  # noqa: B027
+        """Initialize the problem before reduction begins.
+        Subclasses may override this to perform validation or initialization.
+        The default implementation does nothing.
+        """
-    @abstractproperty
+    @property
+    @abstractmethod
     def current_test_case(self) -> T: ...
+    @property
+    @abstractmethod
+    def stats(self) -> ReductionStats: ...
     @abstractmethod
     async def is_interesting(self, test_case: T) -> bool:
         pass
     async def is_reduction(self, test_case: T) -> bool:
+        """Check if test_case would be a valid reduction from current state.
+        A valid reduction is an interesting test case that is smaller than
+        the current one (according to sort_key). This is a convenience method
+        that short-circuits if the candidate is larger.
+        """
         if test_case == self.current_test_case:
             return True
         if self.sort_key(test_case) > self.sort_key(self.current_test_case):
@@ -156,6 +265,23 @@ class ReductionProblem(Generic[T], ABC):
     def display(self, value: T) -> str: ...
     def backtrack(self, new_test_case: T) -> "ReductionProblem[T]":
+        """Create a new problem starting from a different test case.
+        This is used by reduction pumps to try larger test cases temporarily.
+        The new problem shares the same is_interesting predicate but starts
+        from new_test_case instead of current_test_case.
+        If reduction succeeds and the result is smaller than the original
+        current_test_case, it can be adopted into the main problem.
+        Example:
+            # Pump inlines a function, making code larger
+            pumped = await pump(problem)  # Returns larger test case
+            backtracked = problem.backtrack(pumped)
+            # Try to reduce the larger test case
+            await run_passes(backtracked)
+            # If result is smaller than original, keep it
+        """
         return BasicReductionProblem(
             initial=new_test_case,
             is_interesting=self.is_interesting,
@@ -181,6 +307,20 @@ def default_cache_key(value: Any) -> str:
 class BasicReductionProblem(ReductionProblem[T]):
+    """Concrete implementation of ReductionProblem for in-memory reduction.
+    This is the main implementation used by Shrink Ray. It provides:
+    - Caching of interestingness results (by content hash)
+    - Statistics tracking (calls, cache hits, timing)
+    - Callbacks for reduction events
+    - Automatic cache clearing when a reduction succeeds
+    The cache clearing is a practical choice: when we find a smaller test case,
+    cached results for candidates derived from the old test case are no longer
+    useful (we're now reducing from a different starting point). Clearing the
+    cache saves memory and avoids serving stale cache entries that won't help.
+    """
     def __init__(
         self,
         initial: T,
@@ -189,7 +329,7 @@ class BasicReductionProblem(ReductionProblem[T]):
         sort_key: Callable[[T], Any] = default_sort_key,
         size: Callable[[T], int] = default_size,
         display: Callable[[T], str] = default_display,
-        stats: Optional[ReductionStats] = None,
+        stats: ReductionStats | None = None,
         cache_key: Callable[[Any], str] = default_cache_key,
     ):
         super().__init__(work=work)
@@ -198,11 +338,11 @@ class BasicReductionProblem(ReductionProblem[T]):
         self.__size = size
         self.__display = display
         if stats is None:
-            self.stats = ReductionStats()
-            self.stats.initial_test_case_size = self.size(initial)
-            self.stats.current_test_case_size = self.size(initial)
+            self._stats = ReductionStats()
+            self._stats.initial_test_case_size = self.size(initial)
+            self._stats.current_test_case_size = self.size(initial)
         else:
-            self.stats = stats
+            self._stats = stats
         self.__is_interesting_cache: dict[str, bool] = {}
         self.__cache_key = cache_key
@@ -223,6 +363,10 @@ class BasicReductionProblem(ReductionProblem[T]):
     def display(self, value: T) -> str:
         return self.__display(value)
+    @property
+    def stats(self) -> ReductionStats:
+        return self._stats
     def sort_key(self, test_case: T) -> Any:
         return self.__sort_key(test_case)
@@ -234,31 +378,43 @@ class BasicReductionProblem(ReductionProblem[T]):
         call `fn` with the new value. Note that these are called outside the lock."""
         self.__on_reduce_callbacks.append(callback)
-    async def is_interesting(self, value: T) -> bool:
-        """Returns true if this value is interesting."""
+    async def is_interesting(self, test_case: T) -> bool:
+        """Returns true if this test_case is interesting."""
         await trio.lowlevel.checkpoint()
-        if value == self.current_test_case:
+        if test_case == self.current_test_case:
             return True
-        cache_key = self.__cache_key(value)
+        cache_key = self.__cache_key(test_case)
         try:
             return self.__is_interesting_cache[cache_key]
         except KeyError:
             pass
-        result = await self.__is_interesting(value)
+        result = await self.__is_interesting(test_case)
         self.__is_interesting_cache[cache_key] = result
         self.stats.failed_reductions += 1
         self.stats.calls += 1
+        # Update current pass stats if a pass is running
+        if self.current_pass_stats is not None:
+            self.current_pass_stats.test_evaluations += 1
         if result:
             self.stats.interesting_calls += 1
-            if self.sort_key(value) < self.sort_key(self.current_test_case):
+            if self.sort_key(test_case) < self.sort_key(self.current_test_case):
                 self.__is_interesting_cache.clear()
                 self.stats.failed_reductions -= 1
                 self.stats.reductions += 1
                 self.stats.time_of_last_reduction = time.time()
-                self.stats.current_test_case_size = self.size(value)
-                self.__current = value
+                # Update current pass stats for reductions
+                if self.current_pass_stats is not None:
+                    self.current_pass_stats.successful_reductions += 1
+                    size_diff = self.size(self.current_test_case) - self.size(test_case)
+                    self.current_pass_stats.bytes_deleted += size_diff
+                self.stats.current_test_case_size = self.size(test_case)
+                self.__current = test_case
                 for f in self.__on_reduce_callbacks:
-                    await f(value)
+                    await f(test_case)
             else:
                 self.stats.wasted_interesting_calls += 1
         return result
@@ -268,14 +424,32 @@ class BasicReductionProblem(ReductionProblem[T]):
         return self.__current
-class View(ReductionProblem[T], Generic[S, T]):
+class View[S, T](ReductionProblem[T]):
+    """A view of a ReductionProblem through a parse/dump transformation.
+    View wraps an underlying problem, presenting it as a different type.
+    For example, a problem over bytes can be viewed as a problem over
+    lists of lines, or JSON structures, or AST nodes.
+    The View:
+    - Parses the underlying problem's test case on access
+    - Dumps candidates back to the underlying type for testing
+    - Caches the parsed representation for efficiency
+    - Delegates interestingness testing to the underlying problem
+    The caching is subtle: when the underlying problem's test case changes,
+    the View re-parses it. But it only updates its cached value if the new
+    parsed value is "smaller" (according to sort_key), to maintain
+    monotonicity of reduction.
+    """
     def __init__(
         self,
         problem: ReductionProblem[S],
         parse: Callable[[S], T],
         dump: Callable[[T], S],
-        work: Optional[WorkContext] = None,
-        sort_key: Optional[Callable[[T], Any]] = None,
+        work: WorkContext | None = None,
+        sort_key: Callable[[T], Any] | None = None,
     ):
         super().__init__(work=work or problem.work)
         self.__problem = problem
@@ -292,7 +466,7 @@ class View(ReductionProblem[T], Generic[S, T]):
     @property
     def stats(self) -> ReductionStats:
-        return self.__problem.stats  # type: ignore
+        return self.__problem.stats
     @property
     def current_test_case(self) -> T:
@@ -307,7 +481,12 @@ class View(ReductionProblem[T], Generic[S, T]):
         return self.__current
     async def is_interesting(self, test_case: T) -> bool:
-        return await self.__problem.is_interesting(self.__dump(test_case))
+        from shrinkray.passes.definitions import DumpError
+        try:
+            return await self.__problem.is_interesting(self.__dump(test_case))
+        except DumpError:
+            return False
     def sort_key(self, test_case: T) -> Any:
         if self.__sort_key is not None:

shrinkray/process.py ADDED Viewed

@@ -0,0 +1,49 @@
+"""Process management utilities for shrink ray."""
+import os
+import random
+import signal
+import trio
+def signal_group(sp: "trio.Process", sig: int) -> None:
+    """Send a signal to a process group."""
+    gid = os.getpgid(sp.pid)
+    assert gid != os.getgid()
+    os.killpg(gid, sig)
+async def interrupt_wait_and_kill(sp: "trio.Process", delay: float = 0.1) -> None:
+    """Interrupt a process, wait for it to exit, and kill it if necessary.
+    Does nothing beyond a checkpoint if ``sp`` has already exited. Otherwise
+    closes the process's pipes, sends SIGINT to its process group, and polls
+    up to ten times with randomised, growing sleeps, returning as soon as the
+    process is seen to have exited. If it is still running afterwards,
+    SIGKILL is sent to the group and the process is awaited for at most
+    ``delay`` seconds.
+    Args:
+        sp: The subprocess to shut down.
+        delay: Base sleep interval for polling, and the timeout for the final wait.
+    Raises:
+        ValueError: If the process still has no return code after SIGKILL.
+    """
+    await trio.lowlevel.checkpoint()
+    if sp.returncode is None:
+        try:
+            # In case the subprocess forked. Python might hang if you don't close
+            # all pipes.
+            for pipe in [sp.stdout, sp.stderr, sp.stdin]:
+                if pipe:
+                    await pipe.aclose()
+            signal_group(sp, signal.SIGINT)
+            for n in range(10):
+                if sp.poll() is not None:
+                    return
+                await trio.sleep(delay * 1.5**n * random.random())  # jittered sleep; upper bound grows 1.5x per attempt
+        except ProcessLookupError:  # pragma: no cover
+            # This is incredibly hard to trigger reliably, because it only happens
+            # if the process exits at exactly the wrong time.
+            pass
+        if sp.returncode is None:
+            try:
+                signal_group(sp, signal.SIGKILL)
+            except ProcessLookupError:
+                pass  # process lookup failed, so there is nothing left to kill
+        with trio.move_on_after(delay):
+            await sp.wait()
+        if sp.returncode is None:
+            raise ValueError(
+                f"Could not kill subprocess with pid {sp.pid}. Something has gone seriously wrong."
+            )

shrinkray 0.0.0__py3-none-any.whl → 25.12.26.0__py3-none-any.whl

shrinkray 0.0.0__py3-none-any.whl → 25.12.26.0__py3-none-any.whl