PyPI - emx-onnx-cgen - Versions diffs - 0.2.0__py3-none-any.whl → 0.3.1__py3-none-any.whl - Mend

emx-onnx-cgen 0.2.0__py3-none-any.whl → 0.3.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of emx-onnx-cgen might be problematic. Click here for more details.

Files changed (99) hide show

emx_onnx_cgen/_build_info.py +1 -1
emx_onnx_cgen/_version.py +34 -0
emx_onnx_cgen/cli.py +372 -64
emx_onnx_cgen/codegen/__init__.py +2 -0
emx_onnx_cgen/codegen/c_emitter.py +3932 -1398
emx_onnx_cgen/codegen/emitter.py +5 -0
emx_onnx_cgen/compiler.py +169 -343
emx_onnx_cgen/ir/context.py +87 -0
emx_onnx_cgen/ir/model.py +1 -0
emx_onnx_cgen/ir/op_base.py +193 -0
emx_onnx_cgen/ir/op_context.py +65 -0
emx_onnx_cgen/ir/ops/__init__.py +130 -0
emx_onnx_cgen/ir/ops/elementwise.py +146 -0
emx_onnx_cgen/ir/ops/misc.py +421 -0
emx_onnx_cgen/ir/ops/nn.py +580 -0
emx_onnx_cgen/ir/ops/reduce.py +95 -0
emx_onnx_cgen/lowering/__init__.py +79 -1
emx_onnx_cgen/lowering/adagrad.py +114 -0
emx_onnx_cgen/lowering/arg_reduce.py +1 -1
emx_onnx_cgen/lowering/attention.py +1 -1
emx_onnx_cgen/lowering/average_pool.py +1 -1
emx_onnx_cgen/lowering/batch_normalization.py +1 -1
emx_onnx_cgen/lowering/cast.py +1 -1
emx_onnx_cgen/lowering/common.py +406 -11
emx_onnx_cgen/lowering/concat.py +1 -1
emx_onnx_cgen/lowering/constant_of_shape.py +1 -1
emx_onnx_cgen/lowering/conv.py +1 -1
emx_onnx_cgen/lowering/conv_transpose.py +301 -0
emx_onnx_cgen/lowering/cumsum.py +1 -1
emx_onnx_cgen/lowering/depth_space.py +1 -1
emx_onnx_cgen/lowering/dropout.py +1 -1
emx_onnx_cgen/lowering/einsum.py +153 -0
emx_onnx_cgen/lowering/elementwise.py +152 -4
emx_onnx_cgen/lowering/expand.py +1 -1
emx_onnx_cgen/lowering/eye_like.py +1 -1
emx_onnx_cgen/lowering/flatten.py +1 -1
emx_onnx_cgen/lowering/gather.py +1 -1
emx_onnx_cgen/lowering/gather_elements.py +2 -4
emx_onnx_cgen/lowering/gather_nd.py +79 -0
emx_onnx_cgen/lowering/gemm.py +1 -1
emx_onnx_cgen/lowering/global_max_pool.py +59 -0
emx_onnx_cgen/lowering/grid_sample.py +1 -1
emx_onnx_cgen/lowering/group_normalization.py +1 -1
emx_onnx_cgen/lowering/hardmax.py +53 -0
emx_onnx_cgen/lowering/identity.py +7 -6
emx_onnx_cgen/lowering/instance_normalization.py +1 -1
emx_onnx_cgen/lowering/layer_normalization.py +1 -1
emx_onnx_cgen/lowering/logsoftmax.py +6 -2
emx_onnx_cgen/lowering/lp_normalization.py +1 -1
emx_onnx_cgen/lowering/lp_pool.py +141 -0
emx_onnx_cgen/lowering/lrn.py +1 -1
emx_onnx_cgen/lowering/lstm.py +1 -1
emx_onnx_cgen/lowering/matmul.py +7 -8
emx_onnx_cgen/lowering/maxpool.py +1 -1
emx_onnx_cgen/lowering/mean_variance_normalization.py +1 -1
emx_onnx_cgen/lowering/negative_log_likelihood_loss.py +13 -13
emx_onnx_cgen/lowering/non_max_suppression.py +157 -0
emx_onnx_cgen/lowering/nonzero.py +42 -0
emx_onnx_cgen/lowering/one_hot.py +120 -0
emx_onnx_cgen/lowering/pad.py +1 -1
emx_onnx_cgen/lowering/qlinear_matmul.py +212 -0
emx_onnx_cgen/lowering/quantize_linear.py +126 -0
emx_onnx_cgen/lowering/range.py +1 -1
emx_onnx_cgen/lowering/reduce.py +6 -7
emx_onnx_cgen/lowering/registry.py +24 -5
emx_onnx_cgen/lowering/reshape.py +224 -52
emx_onnx_cgen/lowering/resize.py +1 -1
emx_onnx_cgen/lowering/rms_normalization.py +1 -1
emx_onnx_cgen/lowering/rotary_embedding.py +165 -0
emx_onnx_cgen/lowering/scatter_nd.py +82 -0
emx_onnx_cgen/lowering/shape.py +6 -25
emx_onnx_cgen/lowering/size.py +1 -1
emx_onnx_cgen/lowering/slice.py +1 -1
emx_onnx_cgen/lowering/softmax.py +6 -2
emx_onnx_cgen/lowering/softmax_cross_entropy_loss.py +1 -1
emx_onnx_cgen/lowering/split.py +1 -1
emx_onnx_cgen/lowering/squeeze.py +6 -6
emx_onnx_cgen/lowering/tensor_scatter.py +110 -0
emx_onnx_cgen/lowering/tile.py +1 -1
emx_onnx_cgen/lowering/topk.py +134 -0
emx_onnx_cgen/lowering/transpose.py +1 -1
emx_onnx_cgen/lowering/trilu.py +89 -0
emx_onnx_cgen/lowering/unsqueeze.py +6 -6
emx_onnx_cgen/lowering/variadic.py +1 -1
emx_onnx_cgen/lowering/where.py +1 -1
emx_onnx_cgen/onnx_import.py +4 -0
emx_onnx_cgen/onnxruntime_utils.py +11 -0
emx_onnx_cgen/ops.py +4 -0
emx_onnx_cgen/runtime/evaluator.py +785 -43
emx_onnx_cgen/testbench.py +23 -0
emx_onnx_cgen/verification.py +31 -0
{emx_onnx_cgen-0.2.0.dist-info → emx_onnx_cgen-0.3.1.dist-info}/METADATA +33 -6
emx_onnx_cgen-0.3.1.dist-info/RECORD +107 -0
{emx_onnx_cgen-0.2.0.dist-info → emx_onnx_cgen-0.3.1.dist-info}/WHEEL +1 -1
shared/scalar_functions.py +60 -17
shared/ulp.py +65 -0
emx_onnx_cgen-0.2.0.dist-info/RECORD +0 -76
{emx_onnx_cgen-0.2.0.dist-info → emx_onnx_cgen-0.3.1.dist-info}/entry_points.txt +0 -0
{emx_onnx_cgen-0.2.0.dist-info → emx_onnx_cgen-0.3.1.dist-info}/top_level.txt +0 -0

emx_onnx_cgen/_build_info.py CHANGED Viewed

@@ -1,3 +1,3 @@
 """Auto-generated by build backend. Do not edit."""
-BUILD_DATE = '2026-01-15T22:18:39Z'
+BUILD_DATE = '2026-01-23T02:44:13Z'
 GIT_VERSION = 'unknown'

emx_onnx_cgen/_version.py ADDED Viewed

@@ -0,0 +1,34 @@
+# file generated by setuptools-scm
+# don't change, don't track in version control
+__all__ = [
+    "__version__",
+    "__version_tuple__",
+    "version",
+    "version_tuple",
+    "__commit_id__",
+    "commit_id",
+]
+TYPE_CHECKING = False
+if TYPE_CHECKING:
+    from typing import Tuple
+    from typing import Union
+    VERSION_TUPLE = Tuple[Union[int, str], ...]
+    COMMIT_ID = Union[str, None]
+else:
+    VERSION_TUPLE = object
+    COMMIT_ID = object
+version: str
+__version__: str
+__version_tuple__: VERSION_TUPLE
+version_tuple: VERSION_TUPLE
+commit_id: COMMIT_ID
+__commit_id__: COMMIT_ID
+__version__ = version = '0.3.1'
+__version_tuple__ = version_tuple = (0, 3, 1)
+__commit_id__ = commit_id = None

emx_onnx_cgen/cli.py CHANGED Viewed

@@ -10,18 +10,89 @@ import shutil
 import subprocess
 import sys
 import tempfile
+import time
+import signal
 from pathlib import Path
-from typing import Sequence
+from dataclasses import dataclass
+from typing import TYPE_CHECKING, Mapping, Sequence
 import onnx
+from onnx import numpy_helper
 from ._build_info import BUILD_DATE, GIT_VERSION
 from .compiler import Compiler, CompilerOptions
 from .errors import CodegenError, ShapeInferenceError, UnsupportedOpError
 from .onnx_import import import_onnx
+from .onnxruntime_utils import make_deterministic_session_options
+from .testbench import decode_testbench_array
+from .verification import format_success_message, max_ulp_diff
 LOGGER = logging.getLogger(__name__)
+if TYPE_CHECKING:
+    import numpy as np
+@dataclass(frozen=True)
+class CliResult:
+    exit_code: int
+    command_line: str
+    error: str | None = None
+    success_message: str | None = None
+    generated: str | None = None
+    data_source: str | None = None
+    operators: list[str] | None = None
+def run_cli_command(
+    argv: Sequence[str],
+    *,
+    testbench_inputs: Mapping[str, "np.ndarray"] | None = None,
+) -> CliResult:
+    raw_argv = list(argv)
+    parse_argv = raw_argv
+    if raw_argv and raw_argv[0] == "emx-onnx-cgen":
+        parse_argv = raw_argv[1:]
+    parser = _build_parser()
+    args = parser.parse_args(parse_argv)
+    args.command_line = _format_command_line(raw_argv)
+    try:
+        if args.command != "compile":
+            success_message, error, operators = _verify_model(
+                args, include_build_details=False
+            )
+            return CliResult(
+                exit_code=0 if error is None else 1,
+                command_line=args.command_line,
+                error=error,
+                success_message=success_message,
+                operators=operators,
+            )
+        generated, data_source, error = _compile_model(
+            args, testbench_inputs=testbench_inputs
+        )
+        if error:
+            return CliResult(
+                exit_code=1,
+                command_line=args.command_line,
+                error=error,
+            )
+        return CliResult(
+            exit_code=0,
+            command_line=args.command_line,
+            success_message="",
+            generated=generated,
+            data_source=data_source,
+        )
+    except Exception as exc:  # pragma: no cover - defensive reporting
+        LOGGER.exception("Unhandled exception while running CLI command.")
+        return CliResult(
+            exit_code=1,
+            command_line=args.command_line,
+            error=str(exc),
+        )
 def _build_parser() -> argparse.ArgumentParser:
     description = (
@@ -86,6 +157,33 @@ def _build_parser() -> argparse.ArgumentParser:
             "named like the output with a _data suffix"
         ),
     )
+    compile_parser.add_argument(
+        "--truncate-weights-after",
+        type=int,
+        default=None,
+        help=(
+            "Truncate inline weight initializers after N values and insert "
+            "\"...\" placeholders (default: no truncation)"
+        ),
+    )
+    compile_parser.add_argument(
+        "--large-temp-threshold-bytes",
+        type=int,
+        default=1024,
+        help=(
+            "Mark temporary buffers larger than this threshold as static "
+            "(default: 1024)"
+        ),
+    )
+    compile_parser.add_argument(
+        "--large-weight-threshold",
+        type=int,
+        default=1024 * 1024,
+        help=(
+            "Store weights larger than this element count in a binary file "
+            "(default: 1048576; set to 0 to disable)"
+        ),
+    )
     add_restrict_flags(compile_parser)
     verify_parser = subparsers.add_parser(
@@ -111,6 +209,57 @@ def _build_parser() -> argparse.ArgumentParser:
         default=None,
         help="C compiler command to build the testbench binary",
     )
+    verify_parser.add_argument(
+        "--truncate-weights-after",
+        type=int,
+        default=None,
+        help=(
+            "Truncate inline weight initializers after N values and insert "
+            "\"...\" placeholders (default: no truncation)"
+        ),
+    )
+    verify_parser.add_argument(
+        "--large-temp-threshold-bytes",
+        type=int,
+        default=1024,
+        help=(
+            "Mark temporary buffers larger than this threshold as static "
+            "(default: 1024)"
+        ),
+    )
+    verify_parser.add_argument(
+        "--large-weight-threshold",
+        type=int,
+        default=1024,
+        help=(
+            "Store weights larger than this element count in a binary file "
+            "(default: 1024)"
+        ),
+    )
+    verify_parser.add_argument(
+        "--test-data-dir",
+        type=Path,
+        default=None,
+        help=(
+            "Directory containing input_*.pb files to seed verification inputs "
+            "(default: use random testbench inputs)"
+        ),
+    )
+    verify_parser.add_argument(
+        "--max-ulp",
+        type=int,
+        default=100,
+        help="Maximum allowed ULP difference for floating outputs (default: 100)",
+    )
+    verify_parser.add_argument(
+        "--runtime",
+        choices=("onnxruntime", "onnx-reference"),
+        default="onnx-reference",
+        help=(
+            "Runtime backend for verification (default: onnx-reference; "
+            "options: onnxruntime, onnx-reference)"
+        ),
+    )
     add_restrict_flags(verify_parser)
     return parser
@@ -132,7 +281,35 @@ def main(argv: Sequence[str] | None = None) -> int:
 def _handle_compile(args: argparse.Namespace) -> int:
     model_path: Path = args.model
     output_path: Path = args.output or model_path.with_suffix(".c")
-    model_name = args.model_name or output_path.stem
+    model_name = args.model_name or "model"
+    generated, data_source, weight_data, error = _compile_model(args)
+    if error:
+        LOGGER.error("Failed to compile %s: %s", model_path, error)
+        return 1
+    output_path.parent.mkdir(parents=True, exist_ok=True)
+    output_path.write_text(generated or "", encoding="utf-8")
+    LOGGER.info("Wrote C source to %s", output_path)
+    if data_source is not None:
+        data_path = output_path.with_name(
+            f"{output_path.stem}_data{output_path.suffix}"
+        )
+        data_path.write_text(data_source, encoding="utf-8")
+        LOGGER.info("Wrote data source to %s", data_path)
+    if weight_data is not None:
+        weights_path = output_path.with_name(f"{model_name}.bin")
+        weights_path.write_bytes(weight_data)
+        LOGGER.info("Wrote weights binary to %s", weights_path)
+    return 0
+def _compile_model(
+    args: argparse.Namespace,
+    *,
+    testbench_inputs: Mapping[str, "np.ndarray"] | None = None,
+) -> tuple[str | None, str | None, bytes | None, str | None]:
+    model_path: Path = args.model
+    model_name = args.model_name or "model"
     try:
         model_checksum = _model_checksum(model_path)
         model = onnx.load_model(model_path)
@@ -143,27 +320,22 @@ def _handle_compile(args: argparse.Namespace) -> int:
             command_line=args.command_line,
             model_checksum=model_checksum,
             restrict_arrays=args.restrict_arrays,
+            truncate_weights_after=args.truncate_weights_after,
+            large_temp_threshold_bytes=args.large_temp_threshold_bytes,
+            large_weight_threshold=args.large_weight_threshold,
+            testbench_inputs=testbench_inputs,
         )
         compiler = Compiler(options)
         if args.emit_data_file:
-            generated, data_source = compiler.compile_with_data_file(model)
+            generated, data_source, weight_data = (
+                compiler.compile_with_data_file_and_weight_data(model)
+            )
         else:
-            generated = compiler.compile(model)
+            generated, weight_data = compiler.compile_with_weight_data(model)
             data_source = None
     except (OSError, CodegenError, ShapeInferenceError, UnsupportedOpError) as exc:
-        LOGGER.error("Failed to compile %s: %s", model_path, exc)
-        return 1
-    output_path.parent.mkdir(parents=True, exist_ok=True)
-    output_path.write_text(generated, encoding="utf-8")
-    LOGGER.info("Wrote C source to %s", output_path)
-    if data_source is not None:
-        data_path = output_path.with_name(
-            f"{output_path.stem}_data{output_path.suffix}"
-        )
-        data_path.write_text(data_source, encoding="utf-8")
-        LOGGER.info("Wrote data source to %s", data_path)
-    return 0
+        return None, None, None, str(exc)
+    return generated, data_source, weight_data, None
 def _resolve_compiler(cc: str | None, prefer_ccache: bool = False) -> list[str] | None:
@@ -198,18 +370,59 @@ def _resolve_compiler(cc: str | None, prefer_ccache: bool = False) -> list[str]
 def _handle_verify(args: argparse.Namespace) -> int:
+    success_message, error, _operators = _verify_model(
+        args, include_build_details=True
+    )
+    if error is not None:
+        LOGGER.error("Verification failed: %s", error)
+        return 1
+    if success_message:
+        LOGGER.info("%s", success_message)
+    return 0
+def _verify_model(
+    args: argparse.Namespace,
+    *,
+    include_build_details: bool,
+) -> tuple[str | None, str | None, list[str]]:
     import numpy as np
-    import onnxruntime as ort
+    def log_step(step: str, started_at: float) -> None:
+        duration = time.perf_counter() - started_at
+        LOGGER.info("verify step %s: %.3fs", step, duration)
+    def describe_exit_code(returncode: int) -> str:
+        if returncode >= 0:
+            return f"exit code {returncode}"
+        signal_id = -returncode
+        try:
+            signal_name = signal.Signals(signal_id).name
+        except ValueError:
+            signal_name = "unknown"
+        return f"exit code {returncode} (signal {signal_id}: {signal_name})"
     model_path: Path = args.model
-    model_name = args.model_name or model_path.stem
+    model_name = args.model_name or "model"
     model_checksum = _model_checksum(model_path)
     compiler_cmd = _resolve_compiler(args.cc, prefer_ccache=False)
     if compiler_cmd is None:
-        LOGGER.error("No C compiler found (set --cc or CC environment variable).")
-        return 1
+        return (
+            None,
+            "No C compiler found (set --cc or CC environment variable).",
+            [],
+        )
     try:
         model = onnx.load_model(model_path)
+    except OSError as exc:
+        return None, str(exc), []
+    operators = _collect_model_operators(model)
+    operators_display = ", ".join(operators) if operators else "(none)"
+    LOGGER.info("verify operators: %s", operators_display)
+    try:
+        testbench_inputs = _load_test_data_inputs(model, args.test_data_dir)
         options = CompilerOptions(
             template_dir=args.template_dir,
             model_name=model_name,
@@ -217,100 +430,183 @@ def _handle_verify(args: argparse.Namespace) -> int:
             command_line=args.command_line,
             model_checksum=model_checksum,
             restrict_arrays=args.restrict_arrays,
+            truncate_weights_after=args.truncate_weights_after,
+            large_temp_threshold_bytes=args.large_temp_threshold_bytes,
+            large_weight_threshold=args.large_weight_threshold,
+            testbench_inputs=testbench_inputs,
         )
         compiler = Compiler(options)
-        generated = compiler.compile(model)
-    except (OSError, CodegenError, ShapeInferenceError, UnsupportedOpError) as exc:
-        LOGGER.error("Failed to compile %s: %s", model_path, exc)
-        return 1
+        codegen_started = time.perf_counter()
+        generated, weight_data = compiler.compile_with_weight_data(model)
+        log_step("codegen", codegen_started)
+    except (CodegenError, ShapeInferenceError, UnsupportedOpError) as exc:
+        return None, str(exc), operators
     try:
         graph = import_onnx(model)
         output_dtypes = {value.name: value.type.dtype for value in graph.outputs}
         input_dtypes = {value.name: value.type.dtype for value in graph.inputs}
     except (KeyError, UnsupportedOpError, ShapeInferenceError) as exc:
-        LOGGER.error("Failed to resolve model dtype: %s", exc)
-        return 1
+        return None, f"Failed to resolve model dtype: {exc}", operators
     with tempfile.TemporaryDirectory() as temp_dir:
         temp_path = Path(temp_dir)
+        LOGGER.info("verify temp dir: %s", temp_path)
         c_path = temp_path / "model.c"
+        weights_path = temp_path / f"{model_name}.bin"
         exe_path = temp_path / "model"
         c_path.write_text(generated, encoding="utf-8")
+        if weight_data is not None:
+            weights_path.write_bytes(weight_data)
         try:
+            compile_started = time.perf_counter()
+            compile_cmd = [
+                *compiler_cmd,
+                "-std=c99",
+                "-O2",
+                str(c_path),
+                "-o",
+                str(exe_path),
+                "-lm",
+            ]
+            LOGGER.info("verify compile command: %s", shlex.join(compile_cmd))
             subprocess.run(
-                [
-                    *compiler_cmd,
-                    "-std=c99",
-                    "-O2",
-                    str(c_path),
-                    "-o",
-                    str(exe_path),
-                    "-lm",
-                ],
+                compile_cmd,
                 check=True,
                 capture_output=True,
                 text=True,
             )
+            log_step("compile", compile_started)
         except subprocess.CalledProcessError as exc:
-            LOGGER.error("Failed to build testbench: %s", exc.stderr.strip())
-            return 1
+            message = "Failed to build testbench."
+            if include_build_details:
+                details = exc.stderr.strip()
+                if details:
+                    message = f"{message} {details}"
+            return None, message, operators
         try:
+            run_started = time.perf_counter()
             result = subprocess.run(
                 [str(exe_path)],
                 check=True,
                 capture_output=True,
                 text=True,
+                cwd=temp_path,
             )
+            log_step("run", run_started)
         except subprocess.CalledProcessError as exc:
-            LOGGER.error("Testbench execution failed: %s", exc.stderr.strip())
-            return 1
+            return None, (
+                "Testbench execution failed: " + describe_exit_code(exc.returncode)
+            ), operators
     try:
         payload = json.loads(result.stdout)
     except json.JSONDecodeError as exc:
-        LOGGER.error("Failed to parse testbench JSON: %s", exc)
-        return 1
+        return None, f"Failed to parse testbench JSON: {exc}", operators
-    inputs = {
-        name: np.array(value["data"], dtype=input_dtypes[name].np_dtype)
-        for name, value in payload["inputs"].items()
-    }
-    sess = ort.InferenceSession(
-        model.SerializeToString(), providers=["CPUExecutionProvider"]
-    )
+    if testbench_inputs:
+        inputs = {
+            name: values.astype(input_dtypes[name].np_dtype, copy=False)
+            for name, values in testbench_inputs.items()
+        }
+    else:
+        inputs = {
+            name: decode_testbench_array(
+                value["data"], input_dtypes[name].np_dtype
+            )
+            for name, value in payload["inputs"].items()
+        }
+    runtime_name = args.runtime
+    runtime_started = time.perf_counter()
     try:
-        ort_outputs = sess.run(None, inputs)
+        if runtime_name == "onnxruntime":
+            import onnxruntime as ort
+            sess_options = make_deterministic_session_options(ort)
+            sess = ort.InferenceSession(
+                model.SerializeToString(),
+                sess_options=sess_options,
+                providers=["CPUExecutionProvider"],
+            )
+            runtime_outputs = sess.run(None, inputs)
+        else:
+            from onnx.reference import ReferenceEvaluator
+            evaluator = ReferenceEvaluator(model)
+            runtime_outputs = evaluator.run(None, inputs)
     except Exception as exc:
+        log_step(runtime_name, runtime_started)
         message = str(exc)
-        if "NOT_IMPLEMENTED" in message:
+        if runtime_name == "onnxruntime" and "NOT_IMPLEMENTED" in message:
             LOGGER.warning(
                 "Skipping verification for %s: ONNX Runtime does not support the model (%s)",
                 model_path,
                 message,
             )
-            return 0
-        LOGGER.error("ONNX Runtime failed to run %s: %s", model_path, message)
-        return 1
+            return "", None, operators
+        return (
+            None,
+            f"{runtime_name} failed to run {model_path}: {message}",
+            operators,
+        )
+    log_step(runtime_name, runtime_started)
     payload_outputs = payload.get("outputs", {})
+    max_ulp = 0
     try:
-        for value, ort_out in zip(graph.outputs, ort_outputs):
+        for value, runtime_out in zip(graph.outputs, runtime_outputs):
             output_payload = payload_outputs.get(value.name)
             if output_payload is None:
                 raise AssertionError(f"Missing output {value.name} in testbench data")
             info = output_dtypes[value.name]
-            output_data = np.array(output_payload["data"], dtype=info.np_dtype)
+            output_data = decode_testbench_array(
+                output_payload["data"], info.np_dtype
+            ).astype(info.np_dtype, copy=False)
+            runtime_out = runtime_out.astype(info.np_dtype, copy=False)
+            output_data = output_data.reshape(runtime_out.shape)
             if np.issubdtype(info.np_dtype, np.floating):
-                np.testing.assert_allclose(
-                    output_data, ort_out, rtol=1e-4, atol=1e-5
-                )
+                max_ulp = max(max_ulp, max_ulp_diff(output_data, runtime_out))
             else:
-                np.testing.assert_array_equal(output_data, ort_out)
+                np.testing.assert_array_equal(output_data, runtime_out)
     except AssertionError as exc:
-        LOGGER.error("Verification failed: %s", exc)
-        return 1
-    LOGGER.info("Verification succeeded for %s", model_path)
-    return 0
+        return None, str(exc), operators
+    if max_ulp > args.max_ulp:
+        return None, f"Out of tolerance (max ULP {max_ulp})", operators
+    return format_success_message(max_ulp), None, operators
+def _load_test_data_inputs(
+    model: onnx.ModelProto, data_dir: Path | None
+) -> dict[str, "np.ndarray"] | None:
+    if data_dir is None:
+        return None
+    if not data_dir.exists():
+        raise CodegenError(f"Test data directory not found: {data_dir}")
+    input_files = sorted(
+        data_dir.glob("input_*.pb"),
+        key=lambda path: int(path.stem.split("_")[-1]),
+    )
+    if not input_files:
+        raise CodegenError(f"No input_*.pb files found in {data_dir}")
+    if len(input_files) != len(model.graph.input):
+        raise CodegenError(
+            "Test data input count does not match model inputs: "
+            f"{len(input_files)} vs {len(model.graph.input)}."
+        )
+    for value_info in model.graph.input:
+        value_kind = value_info.type.WhichOneof("value")
+        if value_kind != "tensor_type":
+            LOGGER.warning(
+                "Skipping test data load for non-tensor input %s (type %s).",
+                value_info.name,
+                value_kind or "unknown",
+            )
+            return None
+    inputs: dict[str, np.ndarray] = {}
+    for index, path in enumerate(input_files):
+        tensor = onnx.TensorProto()
+        tensor.ParseFromString(path.read_bytes())
+        inputs[model.graph.input[index].name] = numpy_helper.to_array(tensor)
+    return inputs
 def _format_command_line(argv: Sequence[str] | None) -> str:
@@ -326,3 +622,15 @@ def _model_checksum(model_path: Path) -> str:
     digest = hashlib.sha256()
     digest.update(model_path.read_bytes())
     return digest.hexdigest()
+def _collect_model_operators(model: onnx.ModelProto) -> list[str]:
+    operators: list[str] = []
+    seen: set[str] = set()
+    for node in model.graph.node:
+        op_name = f"{node.domain}::{node.op_type}" if node.domain else node.op_type
+        if op_name in seen:
+            continue
+        seen.add(op_name)
+        operators.append(op_name)
+    return operators

emx_onnx_cgen/codegen/__init__.py CHANGED Viewed

@@ -7,6 +7,7 @@ from .c_emitter import (
     GemmOp,
     LoweredModel,
     MatMulOp,
+    QLinearMatMulOp,
     ShapeOp,
     UnaryOp,
 )
@@ -20,6 +21,7 @@ __all__ = [
     "GemmOp",
     "LoweredModel",
     "MatMulOp",
+    "QLinearMatMulOp",
     "ShapeOp",
     "UnaryOp",
 ]

emx-onnx-cgen 0.2.0__py3-none-any.whl → 0.3.1__py3-none-any.whl

Potentially problematic release.

emx-onnx-cgen 0.2.0__py3-none-any.whl → 0.3.1__py3-none-any.whl