onnx-diagnostic 0.8.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- onnx_diagnostic/__init__.py +7 -0
- onnx_diagnostic/__main__.py +4 -0
- onnx_diagnostic/_command_lines_parser.py +1141 -0
- onnx_diagnostic/api.py +15 -0
- onnx_diagnostic/doc.py +100 -0
- onnx_diagnostic/export/__init__.py +2 -0
- onnx_diagnostic/export/api.py +124 -0
- onnx_diagnostic/export/dynamic_shapes.py +1083 -0
- onnx_diagnostic/export/shape_helper.py +296 -0
- onnx_diagnostic/export/validate.py +173 -0
- onnx_diagnostic/ext_test_case.py +1290 -0
- onnx_diagnostic/helpers/__init__.py +1 -0
- onnx_diagnostic/helpers/_log_helper.py +463 -0
- onnx_diagnostic/helpers/args_helper.py +132 -0
- onnx_diagnostic/helpers/bench_run.py +450 -0
- onnx_diagnostic/helpers/cache_helper.py +687 -0
- onnx_diagnostic/helpers/config_helper.py +170 -0
- onnx_diagnostic/helpers/doc_helper.py +163 -0
- onnx_diagnostic/helpers/fake_tensor_helper.py +273 -0
- onnx_diagnostic/helpers/graph_helper.py +386 -0
- onnx_diagnostic/helpers/helper.py +1707 -0
- onnx_diagnostic/helpers/log_helper.py +2245 -0
- onnx_diagnostic/helpers/memory_peak.py +249 -0
- onnx_diagnostic/helpers/mini_onnx_builder.py +600 -0
- onnx_diagnostic/helpers/model_builder_helper.py +469 -0
- onnx_diagnostic/helpers/onnx_helper.py +1200 -0
- onnx_diagnostic/helpers/ort_session.py +736 -0
- onnx_diagnostic/helpers/rt_helper.py +476 -0
- onnx_diagnostic/helpers/torch_helper.py +987 -0
- onnx_diagnostic/reference/__init__.py +4 -0
- onnx_diagnostic/reference/evaluator.py +254 -0
- onnx_diagnostic/reference/ops/__init__.py +1 -0
- onnx_diagnostic/reference/ops/op_add_add_mul_mul.py +68 -0
- onnx_diagnostic/reference/ops/op_attention.py +60 -0
- onnx_diagnostic/reference/ops/op_average_pool_grad.py +63 -0
- onnx_diagnostic/reference/ops/op_bias_softmax.py +16 -0
- onnx_diagnostic/reference/ops/op_cast_like.py +46 -0
- onnx_diagnostic/reference/ops/op_complex.py +26 -0
- onnx_diagnostic/reference/ops/op_concat.py +15 -0
- onnx_diagnostic/reference/ops/op_constant_of_shape.py +67 -0
- onnx_diagnostic/reference/ops/op_fused_matmul.py +31 -0
- onnx_diagnostic/reference/ops/op_gather.py +29 -0
- onnx_diagnostic/reference/ops/op_gather_elements.py +45 -0
- onnx_diagnostic/reference/ops/op_gather_grad.py +12 -0
- onnx_diagnostic/reference/ops/op_memcpy_host.py +11 -0
- onnx_diagnostic/reference/ops/op_mul_sigmoid.py +23 -0
- onnx_diagnostic/reference/ops/op_negxplus1.py +8 -0
- onnx_diagnostic/reference/ops/op_qlinear_average_pool.py +40 -0
- onnx_diagnostic/reference/ops/op_qlinear_conv.py +102 -0
- onnx_diagnostic/reference/ops/op_quick_gelu.py +23 -0
- onnx_diagnostic/reference/ops/op_replace_zero.py +13 -0
- onnx_diagnostic/reference/ops/op_rotary.py +19 -0
- onnx_diagnostic/reference/ops/op_scan.py +65 -0
- onnx_diagnostic/reference/ops/op_scatter_elements.py +107 -0
- onnx_diagnostic/reference/ops/op_scatternd_of_shape.py +22 -0
- onnx_diagnostic/reference/ops/op_simplified_layer_normalization.py +8 -0
- onnx_diagnostic/reference/ops/op_skip_layer_normalization.py +13 -0
- onnx_diagnostic/reference/ops/op_slice.py +20 -0
- onnx_diagnostic/reference/ops/op_transpose_cast.py +16 -0
- onnx_diagnostic/reference/ops/op_tri_matrix.py +17 -0
- onnx_diagnostic/reference/ort_evaluator.py +652 -0
- onnx_diagnostic/reference/quantized_tensor.py +46 -0
- onnx_diagnostic/reference/report_results_comparison.py +95 -0
- onnx_diagnostic/reference/torch_evaluator.py +669 -0
- onnx_diagnostic/reference/torch_ops/__init__.py +56 -0
- onnx_diagnostic/reference/torch_ops/_op_run.py +335 -0
- onnx_diagnostic/reference/torch_ops/access_ops.py +94 -0
- onnx_diagnostic/reference/torch_ops/binary_ops.py +108 -0
- onnx_diagnostic/reference/torch_ops/controlflow_ops.py +121 -0
- onnx_diagnostic/reference/torch_ops/generator_ops.py +36 -0
- onnx_diagnostic/reference/torch_ops/nn_ops.py +196 -0
- onnx_diagnostic/reference/torch_ops/other_ops.py +106 -0
- onnx_diagnostic/reference/torch_ops/reduce_ops.py +130 -0
- onnx_diagnostic/reference/torch_ops/sequence_ops.py +65 -0
- onnx_diagnostic/reference/torch_ops/shape_ops.py +121 -0
- onnx_diagnostic/reference/torch_ops/unary_ops.py +93 -0
- onnx_diagnostic/tasks/__init__.py +90 -0
- onnx_diagnostic/tasks/automatic_speech_recognition.py +188 -0
- onnx_diagnostic/tasks/data/__init__.py +13 -0
- onnx_diagnostic/tasks/data/dummies_imagetext2text_generation_gemma3.onnx +0 -0
- onnx_diagnostic/tasks/feature_extraction.py +162 -0
- onnx_diagnostic/tasks/fill_mask.py +89 -0
- onnx_diagnostic/tasks/image_classification.py +144 -0
- onnx_diagnostic/tasks/image_text_to_text.py +581 -0
- onnx_diagnostic/tasks/image_to_video.py +127 -0
- onnx_diagnostic/tasks/mask_generation.py +143 -0
- onnx_diagnostic/tasks/mixture_of_expert.py +79 -0
- onnx_diagnostic/tasks/object_detection.py +134 -0
- onnx_diagnostic/tasks/sentence_similarity.py +89 -0
- onnx_diagnostic/tasks/summarization.py +227 -0
- onnx_diagnostic/tasks/text2text_generation.py +230 -0
- onnx_diagnostic/tasks/text_classification.py +89 -0
- onnx_diagnostic/tasks/text_generation.py +352 -0
- onnx_diagnostic/tasks/text_to_image.py +95 -0
- onnx_diagnostic/tasks/zero_shot_image_classification.py +128 -0
- onnx_diagnostic/torch_export_patches/__init__.py +21 -0
- onnx_diagnostic/torch_export_patches/eval/__init__.py +725 -0
- onnx_diagnostic/torch_export_patches/eval/model_cases.py +898 -0
- onnx_diagnostic/torch_export_patches/onnx_export_errors.py +1098 -0
- onnx_diagnostic/torch_export_patches/onnx_export_serialization.py +311 -0
- onnx_diagnostic/torch_export_patches/patch_details.py +340 -0
- onnx_diagnostic/torch_export_patches/patch_expressions.py +108 -0
- onnx_diagnostic/torch_export_patches/patch_inputs.py +211 -0
- onnx_diagnostic/torch_export_patches/patch_module.py +1047 -0
- onnx_diagnostic/torch_export_patches/patch_module_helper.py +184 -0
- onnx_diagnostic/torch_export_patches/patches/__init__.py +0 -0
- onnx_diagnostic/torch_export_patches/patches/patch_torch.py +1090 -0
- onnx_diagnostic/torch_export_patches/patches/patch_transformers.py +2139 -0
- onnx_diagnostic/torch_export_patches/serialization/__init__.py +46 -0
- onnx_diagnostic/torch_export_patches/serialization/diffusers_impl.py +34 -0
- onnx_diagnostic/torch_export_patches/serialization/transformers_impl.py +313 -0
- onnx_diagnostic/torch_models/__init__.py +0 -0
- onnx_diagnostic/torch_models/code_sample.py +343 -0
- onnx_diagnostic/torch_models/hghub/__init__.py +1 -0
- onnx_diagnostic/torch_models/hghub/hub_api.py +422 -0
- onnx_diagnostic/torch_models/hghub/hub_data.py +234 -0
- onnx_diagnostic/torch_models/hghub/hub_data_cached_configs.py +4905 -0
- onnx_diagnostic/torch_models/hghub/model_inputs.py +388 -0
- onnx_diagnostic/torch_models/hghub/model_specific.py +76 -0
- onnx_diagnostic/torch_models/llms.py +2 -0
- onnx_diagnostic/torch_models/untrained/__init__.py +0 -0
- onnx_diagnostic/torch_models/untrained/llm_phi2.py +113 -0
- onnx_diagnostic/torch_models/untrained/llm_tiny_llm.py +76 -0
- onnx_diagnostic/torch_models/validate.py +2124 -0
- onnx_diagnostic/torch_onnx/__init__.py +0 -0
- onnx_diagnostic/torch_onnx/runtime_info.py +289 -0
- onnx_diagnostic/torch_onnx/sbs.py +440 -0
- onnx_diagnostic-0.8.0.dist-info/METADATA +213 -0
- onnx_diagnostic-0.8.0.dist-info/RECORD +132 -0
- onnx_diagnostic-0.8.0.dist-info/WHEEL +5 -0
- onnx_diagnostic-0.8.0.dist-info/licenses/LICENSE.txt +19 -0
- onnx_diagnostic-0.8.0.dist-info/top_level.txt +1 -0
|
@@ -0,0 +1,600 @@
|
|
|
1
|
+
import ctypes
|
|
2
|
+
import sys
|
|
3
|
+
from typing import Any, Dict, Iterator, List, Optional, Tuple, Union
|
|
4
|
+
import numpy as np
|
|
5
|
+
from onnx import GraphProto, ModelProto, NodeProto, TensorProto
|
|
6
|
+
import onnx.helper as oh
|
|
7
|
+
import torch
|
|
8
|
+
from .onnx_helper import dtype_to_tensor_dtype, tensor_dtype_to_np_dtype, from_array_extended
|
|
9
|
+
from . import string_type
|
|
10
|
+
|
|
11
|
+
# Storage dtype used to reinterpret 16-bit float raw bytes when they must be
# byte-swapped (numpy has no bfloat16, so both half-float types are handled
# as opaque 16-bit integers). Only consulted on big-endian hosts in
# proto_from_array.
STORAGE_TYPE = {
    TensorProto.FLOAT16: np.int16,
    TensorProto.BFLOAT16: np.int16,
}
|
|
15
|
+
|
|
16
|
+
|
|
17
|
+
def proto_from_array(
    arr: torch.Tensor,
    name: Optional[str] = None,
    verbose: int = 0,
) -> TensorProto:
    """
    Converts a torch Tensor into a TensorProto.

    :param arr: tensor to serialize
    :param name: initializer name, ``None`` is stored as an empty name
    :param verbose: if greater than 1, prints type and shape of large tensors
    :return: a TensorProto
    :raises TypeError: if *arr* is not a ``torch.Tensor``
    :raises NotImplementedError: if *arr* is a sparse tensor
    """
    if not isinstance(arr, torch.Tensor):
        raise TypeError(f"Unexpected type {type(arr)}.")
    if arr.is_sparse:
        raise NotImplementedError(
            f"Sparse tensor is not supported yet but initializer {name!r} is."
        )

    # arr.contiguous() is slow after a transpose, maybe there is a way to optimize this.
    arr_cpu = arr.cpu() if arr.is_contiguous() else arr.contiguous().cpu()

    numel = torch.numel(arr_cpu)
    element_size = arr_cpu.element_size()

    if arr_cpu.dtype in {torch.bfloat16}:
        # numpy has no bfloat16: keep the torch tensor, its raw bytes are
        # copied through ctypes below.
        np_arr = arr_cpu
    elif arr_cpu.data_ptr() == arr.data_ptr():
        # arr was already a contiguous CPU tensor, so arr_cpu aliases its
        # memory; clone so the DLPack view does not share storage with arr.
        copy = arr_cpu.clone().detach().requires_grad_(False)
        assert (
            arr_cpu.data_ptr() == 0 or arr_cpu.data_ptr() != copy.data_ptr()
        ), f"Pointers are not null and different {arr_cpu.data_ptr()} != {copy.data_ptr()}"
        np_arr = np.from_dlpack(copy)
    else:
        np_arr = np.from_dlpack(arr_cpu.detach())

    tensor = TensorProto()
    tensor.dims.extend(arr_cpu.shape)
    # protobuf string fields reject None: fall back to an empty name so the
    # documented default name=None does not raise a TypeError.
    tensor.name = name or ""
    itype = dtype_to_tensor_dtype(arr_cpu.dtype)
    assert not hasattr(TensorProto, "INT4") or itype not in {
        TensorProto.INT4,
        TensorProto.UINT4,
    }, f"Type {arr.dtype} is not supported yet for name={name!r}"
    tensor.data_type = itype

    if verbose > 1 and numel > 100:
        print(f"[proto_from_array] {tensor.data_type}[{arr_cpu.shape}]")

    if isinstance(np_arr, torch.Tensor):
        # bfloat16 path: read the raw bytes directly from the torch storage.
        byte_data = (ctypes.c_ubyte * numel * element_size).from_address(np_arr.data_ptr())
        tensor.raw_data = bytes(byte_data)
        if sys.byteorder == "big":
            # TensorProto.raw_data is defined as little-endian: swap the
            # 16-bit storage words. np.frombuffer on bytes is read-only, so
            # the swapped copy is written back instead of swapped in place.
            # NOTE(review): STORAGE_TYPE maps to np.int16, which is passed to
            # tensor_dtype_to_np_dtype -- confirm that helper accepts it.
            np_dtype = tensor_dtype_to_np_dtype(STORAGE_TYPE[tensor.data_type])
            tensor.raw_data = (
                np.frombuffer(tensor.raw_data, dtype=np_dtype).byteswap().tobytes()
            )
    else:
        tensor.raw_data = np_arr.tobytes()
        if sys.byteorder == "big":
            np_dtype = tensor_dtype_to_np_dtype(tensor.data_type)
            tensor.raw_data = (
                np.frombuffer(tensor.raw_data, dtype=np_dtype).byteswap().tobytes()
            )

    return tensor
|
|
79
|
+
|
|
80
|
+
|
|
81
|
+
class MiniOnnxBuilder:
    """
    Simplified builder to build very simple model.

    The resulting graph has no inputs; every output is a constant rebuilt
    from a stored initializer (see :meth:`append_output_initializer`,
    :meth:`append_output_sequence`, :meth:`append_output_dict`).
    The model is finalized with :meth:`to_onnx`.

    :param target_opset: opset to specify
    :param ir_version: IR version to use
    :param sep: separator to build output names
    """

    def __init__(self, target_opset: int = 18, ir_version: int = 10, sep: str = "___"):
        # initializer name -> np.ndarray | torch.Tensor | TensorProto
        self.initializers_dict: Dict[str, Any] = {}
        self.inputs: List[Any] = []
        self.outputs: List[Any] = []
        self.nodes: List[NodeProto] = []
        # only the default ONNX domain is registered
        self.opsets = {"": target_opset}
        self.ir_version = ir_version
        self.sep = sep

    def append_output_initializer(
        self,
        name: str,
        tensor: Union[np.ndarray, torch.Tensor],
        randomize: bool = False,
    ) -> None:
        """
        Adds an initializer as an output.
        The initializer name is prefixed by ``t_``.
        The output name is *name*.
        If `randomize` is True, the tensor is not stored but replaced by a random
        generator (float types only; other dtypes fall through and are stored).
        """
        if randomize:
            dtype = dtype_to_tensor_dtype(tensor.dtype)
            if dtype in {
                TensorProto.FLOAT,
                TensorProto.FLOAT16,
                TensorProto.DOUBLE,
                TensorProto.BFLOAT16,
            }:
                mini, maxi = tensor.min(), tensor.max()
                if mini < 0 and maxi > 0:
                    # values on both sides of zero: mimic the distribution
                    op_type = "RandomNormal"
                    kwargs = {
                        "mean": float(tensor.mean()),
                        "scale": float(tensor.std()),
                        "seed": 0.0,
                    }
                else:
                    # one-sided values: uniform between the observed bounds
                    op_type = "RandomUniform"
                    kwargs = {
                        "low": float(mini),
                        "high": float(maxi),
                        "seed": 0.0,
                    }
                shape = tuple(map(int, tensor.shape))
                self.nodes.append(
                    oh.make_node(op_type, [], [name], dtype=dtype, shape=shape, **kwargs)
                )
                self.outputs.append(oh.make_tensor_value_info(name, dtype, shape))
                return

        init_name = f"t_{name}"
        assert (
            init_name not in self.initializers_dict
        ), f"name={init_name!r} already in {sorted(self.initializers_dict)}"
        self.initializers_dict[init_name] = tensor
        shape = tuple(map(int, tensor.shape))
        self.outputs.append(
            oh.make_tensor_value_info(name, dtype_to_tensor_dtype(tensor.dtype), shape)
        )
        # Identity exposes the stored initializer under the output name.
        self.nodes.append(oh.make_node("Identity", [init_name], [name]))

    def append_output_sequence(
        self, name: str, tensors: List[Union[np.ndarray, torch.Tensor]]
    ) -> None:
        """
        Adds a sequence of initializers as an output.
        The initializers names are prefixed by ``seq_``.
        The output name is ``name``.
        """
        if not tensors:
            # empty list
            self.nodes.append(oh.make_node("SequenceEmpty", [], [name]))
            # arbitrary element type for an empty sequence
            tensor_type_proto = oh.make_tensor_type_proto(
                elem_type=TensorProto.FLOAT, shape=None
            )
        else:
            assert all(
                isinstance(t, (np.ndarray, torch.Tensor)) for t in tensors
            ), f"Nested sequences are not supported, types are {[type(t) for t in tensors]}"
            names = []
            for i, t in enumerate(tensors):
                init_name = f"seq_{name}_{i}"
                self.initializers_dict[init_name] = t
                names.append(init_name)

            self.nodes.append(oh.make_node("SequenceConstruct", names, [name]))
            # element type taken from the first tensor; assumes a homogeneous
            # sequence -- TODO confirm mixed dtypes are not expected here
            tensor_type_proto = oh.make_tensor_type_proto(
                elem_type=dtype_to_tensor_dtype(tensors[0].dtype), shape=None
            )

        sequence_type_proto = oh.make_sequence_type_proto(tensor_type_proto)
        output = oh.make_value_info(name, type_proto=sequence_type_proto)
        self.outputs.append(output)

    def append_output_dict(
        self, name: str, tensors: Dict[str, Union[np.ndarray, torch.Tensor]]
    ) -> None:
        """
        Adds two outputs, a string tensors for the keys and a sequence of tensors
        for the values.

        The output names are ``{name}{sep}keys`` and ``{name}{sep}values``
        (``name___keys`` and ``name___values`` with the default separator).
        """
        keys = []
        values = []
        for k, v in tensors.items():
            keys.append(k)
            values.append(v)
        self.append_output_initializer(f"{name}{self.sep}keys", np.array(keys, dtype=np.str_))
        self.append_output_sequence(f"{name}{self.sep}values", values)

    def _build_initializers(self, switch_low_high: bool) -> List[TensorProto]:
        """
        Builds initializers.

        :param switch_low_high: invert low, high precision; when True a fast
            raw-bytes path is used for plain numeric arrays
        :return: a list of tensors to be stored in the model
        """
        init_dict = self.initializers_dict
        if switch_low_high:
            # Let's try to minimize the time.
            initializer: List[TensorProto] = []
            for k, v in init_dict.items():
                if isinstance(v, TensorProto):
                    # already serialized
                    initializer.append(v)
                    continue

                if isinstance(v, np.ndarray):
                    itype = dtype_to_tensor_dtype(v.dtype)
                    if itype in {
                        TensorProto.BOOL,
                        TensorProto.STRING,
                        TensorProto.UNDEFINED,
                        TensorProto.COMPLEX64,
                        TensorProto.COMPLEX128,
                        # getattr: INT4/UINT4 only exist in recent onnx releases
                        getattr(TensorProto, "UINT4", 0),
                        getattr(TensorProto, "INT4", 0),
                    }:
                        # types whose serialization is not a plain memory dump:
                        # delegate to the generic converter
                        t = from_array_extended(v, name=k)
                        initializer.append(t)
                        continue

                    from_np = True
                elif isinstance(v, np.float32):
                    # numpy scalars are stored as 1-element arrays
                    t = from_array_extended(np.array([v], dtype=np.float32), name=k)
                    initializer.append(t)
                    continue
                elif isinstance(v, np.float64):
                    t = from_array_extended(np.array([v], dtype=np.float64), name=k)
                    initializer.append(t)
                    continue
                elif isinstance(v, np.float16):
                    t = from_array_extended(np.array([v], dtype=np.float16), name=k)
                    initializer.append(t)
                    continue
                else:
                    assert isinstance(
                        v, torch.Tensor
                    ), f"tensor {k!r} has un unexpected type {type(v)}"
                    assert "FakeTensor" not in str(
                        type(v)
                    ), f"tensor {k!r} cannot be a FakeTensor: {type(v)}"
                    from_np = False
                    itype = dtype_to_tensor_dtype(v.dtype)

                # How to avoid a copy?
                if from_np:
                    # fast path: dump the numpy buffer straight into raw_data
                    tensor = TensorProto()
                    tensor.name = k
                    tensor.dims.extend(v.shape)
                    tensor.data_type = itype
                    tensor.raw_data = v.tobytes()
                else:
                    tensor = proto_from_array(v, name=k)

                initializer.append(tensor)

            return initializer

        # generic (slower) path when no byte switching is requested
        res: List[TensorProto] = []
        for k, v in init_dict.items():
            if isinstance(v, TensorProto):
                res.append(v)
                continue
            if isinstance(v, torch.Tensor):
                # no string tensor
                t = proto_from_array(v, name=k)
                res.append(t)
                continue
            if isinstance(v, np.ndarray):
                t = from_array_extended(v, name=k)
                res.append(t)
                continue
            raise TypeError(
                f"Unable to convert initializer {k!r} with type "
                f"{type(v)} into a TensorProto."
            )
        return res

    def to_onnx(self) -> ModelProto:
        """
        Conversion to onnx.

        :return: the proto
        """
        opsets = [oh.make_opsetid(*o) for o in self.opsets.items()]
        ir_version = self.ir_version
        model = ModelProto()
        model.graph.CopyFrom(GraphProto())
        model.graph.name = "mini_model"
        model.graph.input.extend(self.inputs)
        model.graph.node.extend(self.nodes)
        model.graph.output.extend(self.outputs)
        # switch_low_high is True on little-endian hosts (the fast path)
        initializers = self._build_initializers(switch_low_high=sys.byteorder != "big")
        model.graph.initializer.extend(initializers)
        model.opset_import.extend(opsets)
        model.ir_version = ir_version
        return model
|
|
308
|
+
|
|
309
|
+
|
|
310
|
+
def _flatten_iterator(obj: Any, sep: str) -> Iterator:
    """
    Iterates over every value nested in *obj*, yielding ``(path, value)`` pairs.

    The path encodes the nesting structure so :func:`_unflatten` can rebuild
    the original object:

    * leaves end with a kind tag: ``array``, ``tensor``, ``bool``, ``int``,
      ``float`` (python scalars are wrapped in 1-element numpy arrays);
    * each container level contributes one component, e.g. ``tuple_0``,
      ``list_1``, ``dict_key``; a ``.`` is inserted in the component of the
      *last* element of a container to mark where that container closes;
    * ``None`` yields nothing; an empty container yields one
      ``<type>.{sep}empty`` entry with value ``None``.

    Components are joined with *sep*.
    """
    if obj is not None:
        if isinstance(obj, np.ndarray):
            yield "array", obj
        elif isinstance(obj, torch.Tensor):
            yield "tensor", obj
        elif isinstance(obj, bool):
            # bool must be tested before int: bool is a subclass of int
            yield "bool", np.array([obj], dtype=np.bool_)
        elif isinstance(obj, int):
            yield "int", np.array([obj], dtype=np.int64)
        elif isinstance(obj, float):
            yield "float", np.array([obj], dtype=np.float64)
        elif isinstance(obj, tuple):
            if not obj:
                yield f"tuple.{sep}empty", None
            else:
                for i, o in enumerate(obj):
                    if i == len(obj) - 1:
                        # trailing '.' marks the last element of the tuple
                        for p, oo in _flatten_iterator(o, sep):
                            yield f"tuple_{i}.{sep}{p}", oo
                    else:
                        for p, oo in _flatten_iterator(o, sep):
                            yield f"tuple_{i}{sep}{p}", oo
        elif isinstance(obj, list):
            if not obj:
                yield f"list.{sep}empty", None
            else:
                for i, o in enumerate(obj):
                    if i == len(obj) - 1:
                        # trailing '.' marks the last element of the list
                        for p, oo in _flatten_iterator(o, sep):
                            yield f"list_{i}.{sep}{p}", oo
                    else:
                        for p, oo in _flatten_iterator(o, sep):
                            yield f"list_{i}{sep}{p}", oo
        elif isinstance(obj, dict):
            if not obj:
                yield f"dict.{sep}empty", None
            else:
                for i, (k, v) in enumerate(obj.items()):
                    # sep is the path delimiter: keys containing it could not
                    # be split back apart on deserialization
                    assert sep not in k, (
                        f"Key {k!r} cannot contain '{sep}'. "
                        f"It would interfere with the serialization."
                    )

                    def _mk(k):
                        # tuple keys are rendered as "((a,b,...))" and parsed
                        # back by _unflatten._tryint
                        if isinstance(k, tuple):
                            # this assumes the tuple contains simple types
                            return f"(({','.join(map(str,k))}))"
                        return str(k)

                    if i == len(obj) - 1:
                        # for dicts the closing '.' goes right after "dict"
                        for p, o in _flatten_iterator(v, sep):
                            yield f"dict._{_mk(k)}{sep}{p}", o
                    else:
                        for p, o in _flatten_iterator(v, sep):
                            yield f"dict_{_mk(k)}{sep}{p}", o
        elif obj.__class__.__name__ == "DynamicCache":
            # transformers
            import transformers
            from .cache_helper import CacheKeyValue

            assert isinstance(
                obj, transformers.cache_utils.DynamicCache
            ), f"Unexpected type {type(obj)}"
            obj = CacheKeyValue(obj)
            # serialized as a fixed two-attribute container
            atts = ["key_cache", "value_cache"]
            for i, att in enumerate(atts):
                if i == len(atts) - 1:
                    # closing '.' right after the class name, as for dicts
                    for p, o in _flatten_iterator(getattr(obj, att), sep):
                        yield f"DynamicCache._{att}{sep}{p}", o
                else:
                    for p, o in _flatten_iterator(getattr(obj, att), sep):
                        yield f"DynamicCache_{att}{sep}{p}", o
        elif obj.__class__.__name__ == "StaticCache":
            # transformers
            import transformers
            from .cache_helper import CacheKeyValue

            assert isinstance(
                obj, transformers.cache_utils.StaticCache
            ), f"Unexpected type {type(obj)}"
            obj = CacheKeyValue(obj)
            atts = ["key_cache", "value_cache"]
            # NOTE(review): _unflatten only special-cases the "DynamicCache"
            # prefix; confirm that "StaticCache" payloads can be restored.
            for i, att in enumerate(atts):
                if i == len(atts) - 1:
                    for p, o in _flatten_iterator(getattr(obj, att), sep):
                        yield f"StaticCache._{att}{sep}{p}", o
                else:
                    for p, o in _flatten_iterator(getattr(obj, att), sep):
                        yield f"StaticCache_{att}{sep}{p}", o
        else:
            raise NotImplementedError(f"Unexpected type {type(obj)}")
|
|
403
|
+
|
|
404
|
+
|
|
405
|
+
def create_onnx_model_from_input_tensors(
    inputs: Any,
    switch_low_high: Optional[bool] = None,
    randomize: bool = False,
    sep: str = "___",
) -> ModelProto:
    """
    Creates a model proto including all the value as initializers.
    They can be restored by executing the model
    (see :func:`create_input_tensors_from_onnx_model`).
    We assume these inputs are not bigger than 2Gb,
    the limit of protobuf. Nothing is implemented yet to get around
    that limit.

    :param inputs: anything
    :param switch_low_high: if None, it is equal to ``switch_low_high=sys.byteorder != "big"``
    :param randomize: if True, float tensors are not stored but randomized to save space
    :param sep: separator
    :return: ModelProto

    The function raises an error if not supported.
    """
    if switch_low_high is None:
        switch_low_high = sys.byteorder != "big"
    # NOTE(review): switch_low_high is normalized above but never used
    # afterwards; MiniOnnxBuilder.to_onnx recomputes the same expression
    # internally. Confirm whether this parameter should be forwarded.

    builder = MiniOnnxBuilder(sep=sep)
    for prefix, o in _flatten_iterator(inputs, sep):
        if o is None:
            # "empty container" markers are stored as an empty array
            builder.append_output_initializer(prefix, np.array([]))
        else:
            builder.append_output_initializer(prefix, o, randomize=randomize)
    model = builder.to_onnx()
    # keep a human-readable description of the original structure
    model.doc_string = string_type(inputs, True, True)
    return model
|
|
438
|
+
|
|
439
|
+
|
|
440
|
+
def _unflatten(
    sep: str,
    names: List[str],
    outputs: List[Any],
    pos: int = 0,
    level: int = 0,
    device: str = "cpu",
) -> Tuple[int, Any]:
    """
    Unflattens a list of outputs flattened with :func:`_flatten_iterator`.

    :param sep: separator used to split each name into path components
    :param names: flattened output names (encode the nesting structure)
    :param outputs: values matching *names* one-to-one
    :param pos: index of the first name/output to consume
    :param level: current nesting depth (component index inside each name)
    :param device: torch tensors are moved to this device
    :return: ``(next_pos, value)`` where *next_pos* is the index of the first
        unconsumed entry
    """
    name = names[pos]
    spl = name.split(sep)
    if len(spl) == level + 1:
        # A tensor (leaf): the last component is the kind tag.
        if spl[-1] == "empty":
            return pos + 1, None
        if spl[-1] == "bool":
            return pos + 1, bool(outputs[pos][0])
        if spl[-1] == "int":
            return pos + 1, int(outputs[pos][0])
        if spl[-1] == "float":
            return pos + 1, float(outputs[pos][0])
        if spl[-1] == "array":
            return pos + 1, outputs[pos]
        if spl[-1] == "tensor":
            return pos + 1, torch.from_numpy(outputs[pos]).to(device)
        raise AssertionError(f"Unexpected name {name!r} in {names}")

    # Container: consume siblings until the component carrying the closing
    # '.' marker (inserted by _flatten_iterator on the last element).
    res: List[Any] = []
    while True:
        assert pos < len(names), f"Something went wrong with names={names!r}\nres={res!r}"
        name = names[pos]
        spl = name.split(sep)
        prefix = spl[level]
        next_pos, value = _unflatten(
            sep, names, outputs, pos=pos, level=level + 1, device=device
        )

        # NOTE(review): "StaticCache" prefixes emitted by _flatten_iterator
        # are not handled here and would fall into the generic branch below;
        # confirm whether StaticCache round-trips are expected to work.
        if prefix.startswith("DynamicCache"):
            # keyed entry: "DynamicCache_<att>" or "DynamicCache._<att>" (last)
            key = prefix.split("_", maxsplit=1)[-1]
            res.append((key, value))
            lp = len("DynamicCache")
            end = len(prefix) > lp and prefix[lp] == "."
        elif prefix.startswith("dict"):
            # keyed entry: "dict_<key>" or "dict._<key>" (last)
            key = prefix.split("_", maxsplit=1)[-1]
            res.append((key, value))
            end = len(prefix) > 4 and prefix[4] == "."
        else:
            # positional entry: "tuple_<i>" / "list_<i>", last has a
            # trailing '.'
            res.append(value)
            end = prefix[-1] == "."

        if end:
            # Last element seen: determine the container type to rebuild.
            if prefix.startswith("dict"):
                ty: type = dict
            elif prefix.startswith("list"):
                ty = list
            elif prefix.startswith("tuple"):
                ty = tuple
            elif prefix.startswith("DynamicCache"):
                from transformers.cache_utils import DynamicCache

                ty = DynamicCache
            else:
                raise AssertionError(f"Unexpected prefix={prefix!r}")
            break
        pos = next_pos

    def _tryint(s):
        # Restore dict keys serialized as strings: int, bool or plain string.
        try:
            return int(s)
        except (ValueError, TypeError):
            if s in {"True", "False"}:
                return s == "True"
            return s

    def _make(ty: type, res: Any) -> Any:
        # Rebuild the container from the collected entries.
        if ty.__name__ == "DynamicCache":
            from .cache_helper import CacheKeyValue

            cc = CacheKeyValue()
            for k, v in res:
                setattr(cc, k, v)
            r = cc.make_dynamic_cache()
            return r
        if ty is dict:
            d = {}
            for k, v in res:
                if k.startswith("((") and k.endswith("))"):
                    # tuple key serialized by _flatten_iterator's _mk
                    spl = k[2:-2].split(",")
                    key = tuple(_tryint(s) for s in spl)
                else:
                    key = _tryint(k)
                d[key] = v
            return d
        return ty(res)

    # A single "empty" marker entry means the container had no elements.
    return next_pos, (
        ty() if len(res) == 1 and res[0] in (("dict.", None), None) else _make(ty, res)
    )
|
|
538
|
+
|
|
539
|
+
|
|
540
|
+
def create_input_tensors_from_onnx_model(
    proto: Union[str, ModelProto],
    device: str = "cpu",
    engine: str = "ExtendedReferenceEvaluator",
    sep: str = "___",
) -> Any:
    """
    Restores tensors serialized by
    :func:`create_onnx_model_from_input_tensors`.

    The model has no inputs (every output is a constant), so running it once
    produces all stored values, which are then reassembled into the original
    nested structure.

    :param proto: ModelProto or a path to the model file
    :param device: torch tensors are moved to this device
    :param engine: runtime used to execute the model:
        ``"ExtendedReferenceEvaluator"`` (default), ``"onnx"`` or
        ``"onnxruntime"``
    :param sep: separator used when the tensors were serialized
    :return: restored data

    See example :ref:`l-plot-intermediate-results` for an example.
    """
    if engine == "ExtendedReferenceEvaluator":
        from ..reference import ExtendedReferenceEvaluator

        session = ExtendedReferenceEvaluator(proto)
        output_names = session.output_names
    elif engine == "onnx":
        from onnx.reference import ReferenceEvaluator

        session = ReferenceEvaluator(proto)
        output_names = session.output_names
    elif engine == "onnxruntime":
        from onnxruntime import InferenceSession

        session = InferenceSession(
            proto.SerializeToString() if not isinstance(proto, str) else proto,
            providers=["CPUExecutionProvider"],
        )
        output_names = [o.name for o in session.get_outputs()]
    else:
        raise AssertionError(f"Unexpected value for engine={engine!r}")

    results = session.run(None, {})

    if len(output_names) != 1:
        # Several outputs: rebuild the nested structure from the names.
        return _unflatten(sep, output_names, results, device=device)[1]

    # A single output means the serialized object was a bare leaf.
    name, output = output_names[0], results[0]
    if name == "empty":
        return None
    converters = {
        "array": lambda o: o,
        "bool": lambda o: bool(o[0]),
        "int": lambda o: int(o[0]),
        "float": lambda o: float(o[0]),
        "tensor": lambda o: torch.from_numpy(o).to(device),
    }
    if name in converters:
        return converters[name](output)
    raise AssertionError(f"Unexpected name {name!r} in {output_names}")
|