onnx-diagnostic 0.7.16__py3-none-any.whl → 0.8.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (38)
  1. onnx_diagnostic/__init__.py +1 -1
  2. onnx_diagnostic/_command_lines_parser.py +78 -22
  3. onnx_diagnostic/export/api.py +124 -0
  4. onnx_diagnostic/export/dynamic_shapes.py +2 -1
  5. onnx_diagnostic/export/shape_helper.py +47 -70
  6. onnx_diagnostic/ext_test_case.py +11 -0
  7. onnx_diagnostic/helpers/cache_helper.py +38 -7
  8. onnx_diagnostic/helpers/fake_tensor_helper.py +224 -104
  9. onnx_diagnostic/helpers/helper.py +27 -33
  10. onnx_diagnostic/helpers/log_helper.py +109 -5
  11. onnx_diagnostic/helpers/memory_peak.py +2 -0
  12. onnx_diagnostic/helpers/mini_onnx_builder.py +1 -1
  13. onnx_diagnostic/helpers/model_builder_helper.py +132 -2
  14. onnx_diagnostic/helpers/onnx_helper.py +1 -1
  15. onnx_diagnostic/helpers/ort_session.py +4 -0
  16. onnx_diagnostic/helpers/rt_helper.py +393 -43
  17. onnx_diagnostic/helpers/torch_helper.py +20 -1
  18. onnx_diagnostic/tasks/__init__.py +7 -0
  19. onnx_diagnostic/tasks/automatic_speech_recognition.py +2 -8
  20. onnx_diagnostic/tasks/feature_extraction.py +2 -8
  21. onnx_diagnostic/tasks/image_text_to_text.py +10 -8
  22. onnx_diagnostic/tasks/summarization.py +2 -8
  23. onnx_diagnostic/tasks/text2text_generation.py +3 -8
  24. onnx_diagnostic/tasks/text_generation.py +86 -65
  25. onnx_diagnostic/torch_export_patches/onnx_export_errors.py +718 -438
  26. onnx_diagnostic/torch_export_patches/patch_details.py +340 -0
  27. onnx_diagnostic/torch_export_patches/patch_inputs.py +1 -1
  28. onnx_diagnostic/torch_export_patches/patch_module.py +9 -36
  29. onnx_diagnostic/torch_export_patches/patches/patch_torch.py +12 -6
  30. onnx_diagnostic/torch_export_patches/patches/patch_transformers.py +162 -24
  31. onnx_diagnostic/torch_export_patches/serialization/transformers_impl.py +140 -104
  32. onnx_diagnostic/torch_models/untrained/llm_phi2.py +1 -4
  33. onnx_diagnostic/torch_models/validate.py +626 -228
  34. {onnx_diagnostic-0.7.16.dist-info → onnx_diagnostic-0.8.1.dist-info}/METADATA +1 -1
  35. {onnx_diagnostic-0.7.16.dist-info → onnx_diagnostic-0.8.1.dist-info}/RECORD +38 -36
  36. {onnx_diagnostic-0.7.16.dist-info → onnx_diagnostic-0.8.1.dist-info}/WHEEL +0 -0
  37. {onnx_diagnostic-0.7.16.dist-info → onnx_diagnostic-0.8.1.dist-info}/licenses/LICENSE.txt +0 -0
  38. {onnx_diagnostic-0.7.16.dist-info → onnx_diagnostic-0.8.1.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,340 @@
1
+ import difflib
2
+ import inspect
3
+ import pprint
4
+ import re
5
+ import textwrap
6
+ from typing import Any, Dict, Callable, List, Optional, Tuple, Union
7
+
8
+
9
def clean_code_with_black(code: str) -> str:
    """Changes the code style with :epkg:`black` if available."""
    dedented = textwrap.dedent(code)
    try:
        import black
    except ImportError:
        # black is optional: fall back to the dedented code unchanged.
        return dedented
    try:
        return black.format_str(dedented, mode=black.FileMode(line_length=98))
    except black.parsing.InvalidInput as e:
        raise RuntimeError(f"Unable to parse code\n\n---\n{dedented}\n---\n") from e
20
+
21
+
22
def make_diff_code(code1: str, code2: str, output: Optional[str] = None) -> str:
    """
    Creates a diff between two codes.

    :param code1: first code
    :param code2: second code
    :param output: if not empty, stores the output in this file
    :return: diff
    """
    left = code1.strip().splitlines()
    right = code2.strip().splitlines()
    diff_lines = difflib.unified_diff(
        left,
        right,
        fromfile="original",
        tofile="rewritten",
        lineterm="",
    )
    text = "\n".join(diff_lines)
    if output:
        # Persist the diff when a destination file is given.
        with open(output, "w") as f:
            f.write(text)
    return text
44
+
45
+
46
class PatchInfo:
    """
    Stores information about patches.

    :param function_to_patch: function to patch (or its dotted name as a string)
    :param patch: function patched (the replacement)
    :param family: a category, anything to classify the patch
    """

    __slots__ = ("depends_on", "family", "function_to_patch", "patch")

    def __init__(
        self, function_to_patch: Union[str, Callable], patch: Callable, family: str = ""
    ):
        assert callable(function_to_patch) or isinstance(function_to_patch, str), (
            f"function_to_patch is not a function but {type(function_to_patch)} "
            f"- {function_to_patch!r}"
        )
        # This assertion validates ``patch`` (message fixed accordingly).
        assert callable(patch), (
            f"patch is not a function but {type(patch)} - {patch!r}, "
            f"function_to_patch={function_to_patch!r}"
        )
        # A function whose name starts with 'patched_' is most likely a patch
        # that was never removed before being patched again.
        assert not callable(function_to_patch) or not function_to_patch.__name__.startswith(
            "patched_"
        ), (
            f"A patch was probably not removed because function_to_patch="
            f"{function_to_patch!r} and patch={patch!r}"
        )
        self.family = family
        self.function_to_patch = function_to_patch
        self.patch = patch
        # Other patches whose diffs are reported together with this one
        # (see :meth:`make_diff`).
        self.depends_on: List["PatchInfo"] = []

    def add_dependency(self, patch_info: "PatchInfo"):
        "Registers another patch this one depends on."
        self.depends_on.append(patch_info)

    def __repr__(self) -> str:
        "usual"
        return (
            (
                f"{self.__class__.__name__}({self.function_to_patch!r}, {self.patch!r}, "
                f"{self.family!r})"
            )
            if self.family
            else f"{self.__class__.__name__}({self.function_to_patch!r}, {self.patch!r})"
        )

    def to_tuple(self) -> Tuple[str, Callable, Callable]:
        "Returns ``(family, function_to_patch, patch)``."
        return (self.family, self.function_to_patch, self.patch)

    def to_dict(self) -> Dict[str, Any]:
        "Returns the attributes listed in ``__slots__`` as a dictionary."
        return {k: getattr(self, k) for k in self.__slots__}

    def make_diff(self) -> str:
        """Returns a diff as a string."""
        if isinstance(self.function_to_patch, str):
            # No original source is available for a dotted name,
            # the patched source is shown instead.
            return clean_code_with_black(inspect.getsource(self.patch))
        src1 = clean_code_with_black(inspect.getsource(self.function_to_patch))
        src2 = clean_code_with_black(inspect.getsource(self.patch))
        diff = make_diff_code(src1, src2)
        if not self.depends_on:
            return diff
        # Appends the diffs of the dependent patches.
        res = [diff]
        for d in self.depends_on:
            res.append("")
            res.append(d.make_diff())
        return "\n".join(res)

    @classmethod
    def function_name(cls, f: Callable) -> str:
        "Returns the qualified name of a function."
        return f.__qualname__

    def format_diff(self, format: str = "raw") -> str:
        """
        Format a diff between two function as a string.

        :param format: ``'raw'`` or ``'rst'``
        :return: diff

        .. runpython::
            :showcode:
            :rst:

            import transformers
            import onnx_diagnostic.torch_export_patches.patches.patch_transformers as ptr
            from onnx_diagnostic.torch_export_patches.patch_details import PatchInfo
            from onnx_diagnostic.torch_export_patches.patches.patch_transformers import (
                patched_eager_mask,
            )

            eager_mask = transformers.masking_utils.eager_mask
            diff = PatchInfo(eager_mask, patched_eager_mask).format_diff(format="rst")
            print(diff)
        """
        diff = self.make_diff()
        kind = self.family or ""
        if kind:
            kind = f"{kind}: "
        function_to_patch_name = (
            f"{self.function_to_patch!r}"
            if isinstance(self.function_to_patch, str)
            else self.function_name(self.function_to_patch)
        )
        patch_name = self.function_name(self.patch)
        title = f"{kind}{function_to_patch_name} -> {patch_name}"
        if format == "raw":
            return f"{title}\n{diff}"

        rows = [
            title,
            "=" * len(title),
            "",
            ".. code-block:: diff",
            " :linenos:",
            "",
            textwrap.indent(diff, prefix=" "),
        ]
        return "\n".join(rows)
166
+
167
+
168
class PatchDetails:
    """
    This class is used to store patching information.
    This helps understanding which rewriting was applied to which
    method of functions. Page :ref:`l-patch-diff` contains all the
    diff for all the implemented patches.

    .. runpython::
        :showcode:
        :rst:

        import torch
        from onnx_diagnostic.torch_export_patches import torch_export_patches
        from onnx_diagnostic.torch_export_patches.patch_inputs import use_dyn_not_str
        from onnx_diagnostic.torch_export_patches.patch_details import PatchDetails
        from onnx_diagnostic.torch_models.hghub import get_untrained_model_with_inputs

        data = get_untrained_model_with_inputs("arnir0/Tiny-LLM", verbose=0)
        model, inputs, ds = data["model"], data["inputs"], data["dynamic_shapes"]
        details = PatchDetails()
        with torch_export_patches(
            patch_transformers=True, patch_details=details, patch_torch=False
        ):
            ep = torch.export.export(
                model, (), kwargs=inputs, dynamic_shapes=use_dyn_not_str(ds)
            )
        patches = details.patches_involded_in_graph(ep.graph)
        report = details.make_report(patches, format="rst")
        print(report)
    """

    def __init__(self):
        # Registered patches, in registration order.
        self.patched: List["PatchInfo"] = []
        # Cache for :meth:`find`; only successful lookups are cached.
        self.find_cache: Dict[str, "PatchInfo"] = {}

    def find(self, name: str) -> Optional["PatchInfo"]:
        "Finds a patch by the name of its replacement function."
        if name in self.find_cache:
            return self.find_cache[name]
        for p in self.patched:
            if p.patch.__name__ == name:
                self.find_cache[name] = p
                return p
        return None

    def append(
        self, family: str, function_to_patch: Union[str, Callable], patch: Callable
    ) -> "PatchInfo":
        """
        Stores a patch.

        :param family: a category, anything to classify the patch
        :param function_to_patch: function to patch
        :param patch: function patched
        :return: instance of PatchInfo
        """
        p = PatchInfo(function_to_patch, patch, family=family)
        self.patched.append(p)
        return p

    @property
    def n_patches(self) -> int:
        "Returns the number of stored patches."
        # Overwritten __len__ may have an impact on bool(patch_details: PatchDetails)
        return len(self.patched)

    def data(self) -> List[Dict[str, Any]]:
        """Returns the data for a dataframe."""
        return [p.to_dict() for p in self.patched]

    def patches_involded_in_graph(
        self, graph: "torch.fx.Graph"  # noqa: F821
    ) -> List[Tuple["PatchInfo", List["torch.fx.Node"]]]:  # noqa: F821
        """
        Enumerates all patches impacting a graph.
        The function goes through the graph node (only the main graph) and
        looks into the metadata to determine if a listed patch was involved.

        :param graph: fx graph
        :return: list of nodes impacted by a patch
        """
        # Pre-compute the source file and line interval of every patch.
        patches = []
        for patch in self.patched:
            f = patch.patch
            source = inspect.getsourcefile(f)
            lines, lineno = inspect.getsourcelines(f)
            interval = [lineno, lineno + len(lines)]
            patches.append((patch, f, source, interval))

        cst = "onnx_diagnostic"
        node_stack = []
        for node in graph.nodes:
            meta = node.meta
            if "stack_trace" not in meta:
                continue
            stack = meta["stack_trace"]
            if cst not in stack:
                # to reduce the cost of the next iteration
                continue
            node_stack.append((node, stack))

        # The pattern does not depend on the patch: compile it once
        # instead of once per patch.
        reg = re.compile('File "([^"]*?%s[^"]+?)", line (\\d+)' % cst)

        patch_node = []
        patched_nodes = set()
        for patch, _f, source, interval in patches:
            for node, stack in node_stack:
                occ = reg.findall(stack)
                if not occ:
                    continue
                for filename, line_number in occ:
                    # Normalize path separators before comparing files.
                    if source.replace("\\", "/").strip("/") != filename.replace(
                        "\\", "/"
                    ).strip("/"):
                        continue
                    line = int(line_number)
                    if (
                        line >= interval[0]
                        and line <= interval[1]
                        and self.matching_pair(patch, node)
                    ):
                        patch_node.append((patch, node))
                        patched_nodes.add(id(node))

        # checks all patches were discovered
        for node, _ in node_stack:
            assert id(node) in patched_nodes, (
                f"One node was patched but no patch was found:\n"
                f"node: {node.target}({','.join(map(str, node.args))}) -> {node.name}"
                f"\n--\n{pprint.pformat(node.meta)}"
            )

        # Groups the nodes by patch, preserving insertion order.
        res = {}  # type: ignore[var-annotated]
        for patch, node in patch_node:
            if patch not in res:
                res[patch] = []
            res[patch].append(node)
        return list(res.items())

    # Correctly spelled alias; the historical (misspelled) name above
    # remains the canonical one for backward compatibility.
    patches_involved_in_graph = patches_involded_in_graph

    def matching_pair(
        self, patch: "PatchInfo", node: "torch.fx.Node"  # noqa: F821
    ) -> bool:
        """
        Last validation for a pair. RotaryEmbedding has many rewriting
        and they all end up in the same code line.
        """
        if isinstance(patch.function_to_patch, str):
            # A dotted name has no __qualname__; nothing more to check.
            return True
        cls_name = patch.function_to_patch.__qualname__.split(".")[0]
        if not cls_name.endswith("RotaryEmbedding"):
            return True
        return cls_name in str(node.meta)

    def make_report(
        self,
        patches: List[Tuple["PatchInfo", List["torch.fx.Node"]]],  # noqa: F821
        format: str = "raw",
    ) -> str:
        """
        Creates a report based on the involved patches.

        :param patches: from method :meth:`patches_involded_in_graph`
        :param format: format of the report, ``'raw'`` or ``'rst'``
        :return: report
        """
        rows = []
        for patch, nodes in patches:
            rows.append(patch.format_diff(format=format))
            rows.append("")
            if format == "rst":
                rows.extend(["", "", "**impacted nodes**", "", "", ".. code-block::", ""])
                for node in nodes:
                    rows.append(
                        f" {node.target}({', '.join(map(str, node.args))}) -> {node.name}"
                    )
                rows.append("")
        return "\n".join(rows)
@@ -38,7 +38,7 @@ def _make_shape(subset: Dict, cls: type, value: Any) -> Any:
38
38
  for v in subset.values():
39
39
  axes = v
40
40
  break
41
- new_shape = [[axes for i in range(cache_length)], [axes for i in range(cache_length)]]
41
+ new_shape = [axes for i in range(cache_length * 2)]
42
42
  return new_shape
43
43
  if value.__class__ in torch.utils._pytree.SUPPORTED_NODES:
44
44
  raise NotImplementedError(
@@ -1,7 +1,6 @@
1
1
  import ast
2
2
  import copy
3
3
  import contextlib
4
- import difflib
5
4
  import inspect
6
5
  import os
7
6
  import types
@@ -9,6 +8,7 @@ import textwrap
9
8
  import sys
10
9
  from typing import Callable, Dict, List, Set, Optional, Tuple, Union
11
10
  from .patch_module_helper import code_needing_rewriting
11
+ from .patch_details import PatchDetails, make_diff_code, clean_code_with_black
12
12
 
13
13
  NODE_TYPES = tuple(
14
14
  getattr(ast, k)
@@ -881,6 +881,7 @@ def torch_export_rewrite(
881
881
  ] = None,
882
882
  dump_rewriting: Optional[str] = None,
883
883
  verbose: int = 0,
884
+ patch_details: Optional[PatchDetails] = None,
884
885
  ):
885
886
  """
886
887
  Automatically rewrite the methods given in `rewrite` to export
@@ -897,6 +898,8 @@ def torch_export_rewrite(
897
898
  :param verbose: verbosity, up to 10, 10 shows the rewritten code,
898
899
  ``verbose=1`` shows the rewritten function,
899
900
  ``verbose=2`` shows the rewritten code as well
901
+ :param patch_details: to store any applied patch and get a better understanding
902
+ of the applied modifications
900
903
 
901
904
  Example:
902
905
 
@@ -1019,7 +1022,7 @@ def torch_export_rewrite(
1019
1022
  if verbose:
1020
1023
  print(f"[torch_export_rewrite] dump original code in {filename1!r}")
1021
1024
  with open(filename1, "w") as f:
1022
- code = _clean_code(inspect.getsource(to_rewrite))
1025
+ code = clean_code_with_black(inspect.getsource(to_rewrite))
1023
1026
  f.write(code)
1024
1027
  rewr = transform_method(to_rewrite, verbose=max(verbose - 1, 0), **kws)
1025
1028
  if dump_rewriting:
@@ -1027,10 +1030,12 @@ def torch_export_rewrite(
1027
1030
  if verbose:
1028
1031
  print(f"[torch_export_rewrite] dump rewritten code in {filename2!r}")
1029
1032
  with open(filename2, "w") as f:
1030
- rcode = _clean_code(rewr.code)
1033
+ rcode = clean_code_with_black(rewr.code)
1031
1034
  f.write(rcode)
1032
1035
  diff = os.path.join(dump_rewriting, f"{kind}.{cls_name}.{name}.diff")
1033
- make_diff(code, rcode, diff)
1036
+ make_diff_code(code, rcode, diff)
1037
+ if patch_details:
1038
+ patch_details.append("rewrite", getattr(cls, name), rewr.func)
1034
1039
  setattr(cls, name, rewr.func)
1035
1040
 
1036
1041
  try:
@@ -1040,35 +1045,3 @@ def torch_export_rewrite(
1040
1045
  if verbose:
1041
1046
  print(f"[torch_export_rewrite] restored {kind} {cls.__name__}.{name}")
1042
1047
  setattr(cls, name, me)
1043
-
1044
-
1045
- def _clean_code(code: str) -> str:
1046
- try:
1047
- import black
1048
- except ImportError:
1049
- return code
1050
- return black.format_str(code, mode=black.FileMode(line_length=98))
1051
-
1052
-
1053
- def make_diff(code1: str, code2: str, output: Optional[str] = None) -> str:
1054
- """
1055
- Creates a diff between two codes.
1056
-
1057
- :param code1: first code
1058
- :param code2: second code
1059
- :param output: if not empty, stores the output in this file
1060
- :return: diff
1061
- """
1062
- text = "\n".join(
1063
- difflib.unified_diff(
1064
- code1.strip().splitlines(),
1065
- code2.strip().splitlines(),
1066
- fromfile="original",
1067
- tofile="rewritten",
1068
- lineterm="",
1069
- )
1070
- )
1071
- if output:
1072
- with open(output, "w") as f:
1073
- f.write(text)
1074
- return text
@@ -195,9 +195,12 @@ class patched_ShapeEnv:
195
195
  if self.frozen:
196
196
  self.counter["ignored_backward_guard"] += 1
197
197
  # PATCHED: raised an exception instead of logging.
198
+ import transformers
199
+
198
200
  raise AssertionError(
199
201
  f"[patched_ShapeEnv] Ignored guard {expr} == {concrete_val}, "
200
- f"this could result in accuracy problems"
202
+ f"this could result in accuracy problems, transformers.__version__="
203
+ f"{transformers.__version__!r}"
201
204
  )
202
205
 
203
206
  def _set_replacement(
@@ -683,7 +686,7 @@ class patched_ShapeEnv:
683
686
  return concrete_val
684
687
 
685
688
 
686
- def patched_vmap(func, in_dims=0, out_dims=0):
689
+ def patched_vmap(func, in_dims=0, out_dims=0, use_scan: bool = False):
687
690
  """
688
691
  Python implementation of :func:`torch.vmap`.
689
692
  The implementation raises an issue when it is being exported with
@@ -724,8 +727,9 @@ def patched_vmap(func, in_dims=0, out_dims=0):
724
727
  arg = arg.movedim(in_dim, 0)
725
728
  batched_args.append(arg)
726
729
 
727
- if all(isinstance(a, torch.Tensor) for a in args) and isinstance(
728
- batch_size, torch.SymInt
730
+ if use_scan or (
731
+ all(isinstance(a, torch.Tensor) for a in args)
732
+ and isinstance(batch_size, torch.SymInt)
729
733
  ):
730
734
  batched_tensors = [
731
735
  (
@@ -735,7 +739,9 @@ def patched_vmap(func, in_dims=0, out_dims=0):
735
739
  )
736
740
  for arg, in_dim in zip(batched_args, in_dims_)
737
741
  ]
738
- results = torch.ops.higher_order.scan(func, [], batched_tensors, [])
742
+ results = torch.ops.higher_order.scan(
743
+ lambda *args, **kwargs: [func(*args, **kwargs)], [], batched_tensors, []
744
+ )
739
745
  stacked = results[0]
740
746
  if out_dims != 0:
741
747
  return stacked.movedim(0, out_dims)
@@ -745,7 +751,7 @@ def patched_vmap(func, in_dims=0, out_dims=0):
745
751
  torch._check(
746
752
  not isinstance(batch_size, torch.SymInt),
747
753
  lambda: (
748
- f"patched_vmap supports dynamic batch_size only if all argument "
754
+ f"patched_vmap supports dynamic batch_size only if all arguments "
749
755
  f"are tensors but types are {[type(a) for a in args]}"
750
756
  ),
751
757
  )