onnx-diagnostic 0.5.0__py3-none-any.whl → 0.6.1__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- onnx_diagnostic/__init__.py +2 -2
- onnx_diagnostic/_command_lines_parser.py +39 -1
- onnx_diagnostic/api.py +15 -0
- onnx_diagnostic/export/dynamic_shapes.py +14 -5
- onnx_diagnostic/ext_test_case.py +15 -1
- onnx_diagnostic/helpers/args_helper.py +1 -1
- onnx_diagnostic/helpers/graph_helper.py +386 -0
- onnx_diagnostic/helpers/helper.py +30 -5
- onnx_diagnostic/helpers/model_builder_helper.py +349 -0
- onnx_diagnostic/helpers/rt_helper.py +69 -1
- onnx_diagnostic/helpers/torch_helper.py +2 -0
- onnx_diagnostic/reference/__init__.py +1 -0
- onnx_diagnostic/reference/torch_evaluator.py +518 -0
- onnx_diagnostic/reference/torch_ops/__init__.py +55 -0
- onnx_diagnostic/reference/torch_ops/_op_run.py +326 -0
- onnx_diagnostic/reference/torch_ops/access_ops.py +84 -0
- onnx_diagnostic/reference/torch_ops/binary_ops.py +108 -0
- onnx_diagnostic/reference/torch_ops/controlflow_ops.py +118 -0
- onnx_diagnostic/reference/torch_ops/generator_ops.py +35 -0
- onnx_diagnostic/reference/torch_ops/nn_ops.py +176 -0
- onnx_diagnostic/reference/torch_ops/other_ops.py +106 -0
- onnx_diagnostic/reference/torch_ops/reduce_ops.py +130 -0
- onnx_diagnostic/reference/torch_ops/sequence_ops.py +65 -0
- onnx_diagnostic/reference/torch_ops/shape_ops.py +120 -0
- onnx_diagnostic/reference/torch_ops/unary_ops.py +86 -0
- onnx_diagnostic/tasks/__init__.py +22 -1
- onnx_diagnostic/tasks/image_classification.py +2 -2
- onnx_diagnostic/tasks/text_generation.py +3 -3
- onnx_diagnostic/torch_export_patches/eval/__init__.py +690 -0
- onnx_diagnostic/torch_export_patches/eval/model_cases.py +883 -0
- onnx_diagnostic/torch_export_patches/onnx_export_errors.py +34 -1
- onnx_diagnostic/torch_export_patches/onnx_export_serialization.py +6 -1
- onnx_diagnostic/torch_export_patches/patch_module_helper.py +148 -28
- onnx_diagnostic/torch_export_patches/patches/patch_torch.py +91 -0
- onnx_diagnostic/torch_export_patches/patches/patch_transformers.py +117 -1
- onnx_diagnostic/torch_models/hghub/hub_data_cached_configs.py +142 -0
- onnx_diagnostic/torch_models/test_helper.py +225 -22
- onnx_diagnostic/torch_onnx/runtime_info.py +289 -0
- {onnx_diagnostic-0.5.0.dist-info → onnx_diagnostic-0.6.1.dist-info}/METADATA +1 -1
- {onnx_diagnostic-0.5.0.dist-info → onnx_diagnostic-0.6.1.dist-info}/RECORD +43 -24
- {onnx_diagnostic-0.5.0.dist-info → onnx_diagnostic-0.6.1.dist-info}/WHEEL +1 -1
- {onnx_diagnostic-0.5.0.dist-info → onnx_diagnostic-0.6.1.dist-info}/licenses/LICENSE.txt +0 -0
- {onnx_diagnostic-0.5.0.dist-info → onnx_diagnostic-0.6.1.dist-info}/top_level.txt +0 -0
onnx_diagnostic/tasks/__init__.py

```diff
@@ -39,9 +39,30 @@ def supported_tasks() -> List[str]:
 
 def reduce_model_config(config: Any, task: str) -> Dict[str, Any]:
     """Reduces a model size."""
+    head_size0 = (
+        config.head_dim
+        if hasattr(config, "head_dim") and config.head_dim
+        else (
+            config.hidden_size // config.num_attention_heads
+            if hasattr(config, "hidden_size") and hasattr(config, "num_attention_heads")
+            else None
+        )
+    )
     tasks = {mod.__TASK__: mod.reduce_model_config for mod in __TASKS__}
     assert task in tasks, f"Task {task!r} not found in {sorted(tasks)}"
-    return tasks[task](config)
+    res = tasks[task](config)
+    if head_size0 and "head_dim" in res:
+        head_size = (
+            config.head_dim
+            if hasattr(config, "head_dim") and config.head_dim
+            else config.hidden_size // config.num_attention_heads
+        )
+        assert head_size0 == head_size or head_size % 16 == 0, (
+            f"head_size should be a multiple of 16 "
+            f"(head_size0={head_size0}), res={res}, "
+            f"config=\n{config}"
+        )
+    return res
 
 
 def random_input_kwargs(config: Any, task: str) -> Tuple[Dict[str, Any], Callable]:
```
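The new guard computes a reference head size before the task-specific reduction runs and re-checks it afterwards. The fallback it uses is the usual transformers convention: take `config.head_dim` when it is set and truthy, otherwise derive `hidden_size // num_attention_heads`. A minimal sketch of that derivation, using a hypothetical `SimpleNamespace` stand-in rather than a real model config:

```python
from types import SimpleNamespace
from typing import Optional

def head_size(config) -> Optional[int]:
    """head_dim when the config defines a truthy one, otherwise the
    hidden_size // num_attention_heads fallback, else None."""
    if getattr(config, "head_dim", None):
        return config.head_dim
    if hasattr(config, "hidden_size") and hasattr(config, "num_attention_heads"):
        return config.hidden_size // config.num_attention_heads
    return None

# hypothetical config: 32 heads over a 4096-wide hidden state -> 128 per head
cfg = SimpleNamespace(hidden_size=4096, num_attention_heads=32)
assert head_size(cfg) == 128  # 128 % 16 == 0, so the new assertion would pass
```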
onnx_diagnostic/tasks/image_classification.py

```diff
@@ -58,8 +58,8 @@ def get_inputs(
     shapes = {
         "pixel_values": {
             0: torch.export.Dim("batch", min=1, max=1024),
-            2:
-            3:
+            2: "width",
+            3: "height",
         },
     }
     inputs = dict(
```
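The `torch.export.Dim` objects on axes 2 and 3 are replaced with plain strings, which recent PyTorch releases (roughly 2.6 onward) accept in a `dynamic_shapes` spec as named, unconstrained dynamic dimensions. A sketch of how such a spec is passed to `torch.export.export`; the `Scale` module and input sizes here are illustrative stand-ins, not the package's model:

```python
import torch

class Scale(torch.nn.Module):
    # toy stand-in for an image model taking NCHW pixel_values
    def forward(self, pixel_values):
        return pixel_values * 2.0

dynamic_shapes = {
    "pixel_values": {
        0: torch.export.Dim("batch", min=1, max=1024),  # bounded Dim object
        2: "width",   # string shorthand: a named dynamic dimension
        3: "height",
    }
}
ep = torch.export.export(
    Scale(), (torch.randn(2, 3, 224, 224),), dynamic_shapes=dynamic_shapes
)
print(ep)  # batch, width, height appear as symbolic sizes in the graph
```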
onnx_diagnostic/tasks/text_generation.py

```diff
@@ -27,7 +27,7 @@ def reduce_model_config(config: Any) -> Dict[str, Any]:
     kwargs = dict(
         num_hidden_layers=min(config.num_hidden_layers, 2),
         intermediate_size=256 if config is None else min(512, config.intermediate_size),
-        hidden_size=
+        hidden_size=512 if config is None else min(512, config.hidden_size),
         cls_cache="MambaCache",
         state_size=8 if config is None else getattr(config, "state_size", None),
         conv_kernel=4 if config is None else getattr(config, "conv_kernel", None),
```
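The previously truncated `hidden_size=` keyword is completed with the same clamp-to-512 pattern used for `intermediate_size`: every size-like hyperparameter is capped so a tiny test model can be instantiated. A hedged sketch of that pattern; the helper name and `SimpleNamespace` config are illustrative, not from the package:

```python
from types import SimpleNamespace

def reduce_text_generation_config(config=None) -> dict:
    """Illustrative mirror of the kwargs above: clamp each size-like field
    so the test model stays tiny; a None config falls back to fixed defaults."""
    return dict(
        num_hidden_layers=2 if config is None else min(config.num_hidden_layers, 2),
        intermediate_size=256 if config is None else min(512, config.intermediate_size),
        hidden_size=512 if config is None else min(512, config.hidden_size),
        state_size=8 if config is None else getattr(config, "state_size", None),
        conv_kernel=4 if config is None else getattr(config, "conv_kernel", None),
    )

cfg = SimpleNamespace(num_hidden_layers=32, intermediate_size=8192,
                      hidden_size=4096, state_size=16, conv_kernel=4)
print(reduce_text_generation_config(cfg))
# -> layers clamped to 2, intermediate/hidden to 512; state_size/conv_kernel kept
```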
onnx_diagnostic/tasks/text_generation.py

```diff
@@ -44,8 +44,8 @@ def reduce_model_config(config: Any) -> Dict[str, Any]:
             else config.num_attention_heads
         ),
         hidden_size=(
-            min(config.hidden_size,
-            if config.hidden_size %
+            min(config.hidden_size, 4096 // 4)
+            if config.hidden_size % 64 == 0
             else config.hidden_size
         ),
     )
```
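The restored expression clamps `hidden_size` to `4096 // 4 == 1024`, but only when the original value is divisible by 64, presumably so the reduced width still divides evenly across attention heads. A small standalone check of that rule (the function name is hypothetical):

```python
def reduced_hidden_size(hidden_size: int) -> int:
    """Mirror of the expression above: shrink hidden_size to at most
    4096 // 4 == 1024, and only when it is a multiple of 64."""
    return min(hidden_size, 4096 // 4) if hidden_size % 64 == 0 else hidden_size

assert reduced_hidden_size(4096) == 1024   # divisible by 64 -> clamped
assert reduced_hidden_size(768) == 768     # already small, min() keeps it
assert reduced_hidden_size(1000) == 1000   # not a multiple of 64 -> untouched
```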