PyPI - emx-onnx-cgen - Versions diffs - 0.3.0__py3-none-any.whl → 0.3.2__py3-none-any.whl - Mend

emx-onnx-cgen 0.3.0__py3-none-any.whl → 0.3.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (94) hide show

emx_onnx_cgen/_build_info.py +1 -1
emx_onnx_cgen/_version.py +2 -2
emx_onnx_cgen/cli.py +50 -23
emx_onnx_cgen/codegen/__init__.py +2 -0
emx_onnx_cgen/codegen/c_emitter.py +1844 -1568
emx_onnx_cgen/codegen/emitter.py +5 -0
emx_onnx_cgen/compiler.py +30 -387
emx_onnx_cgen/ir/context.py +87 -0
emx_onnx_cgen/ir/op_base.py +193 -0
emx_onnx_cgen/ir/op_context.py +65 -0
emx_onnx_cgen/ir/ops/__init__.py +130 -0
emx_onnx_cgen/ir/ops/elementwise.py +146 -0
emx_onnx_cgen/ir/ops/misc.py +421 -0
emx_onnx_cgen/ir/ops/nn.py +580 -0
emx_onnx_cgen/ir/ops/reduce.py +95 -0
emx_onnx_cgen/lowering/__init__.py +79 -1
emx_onnx_cgen/lowering/adagrad.py +114 -0
emx_onnx_cgen/lowering/arg_reduce.py +1 -1
emx_onnx_cgen/lowering/attention.py +1 -1
emx_onnx_cgen/lowering/average_pool.py +1 -1
emx_onnx_cgen/lowering/batch_normalization.py +1 -1
emx_onnx_cgen/lowering/cast.py +1 -1
emx_onnx_cgen/lowering/common.py +36 -18
emx_onnx_cgen/lowering/concat.py +1 -1
emx_onnx_cgen/lowering/constant_of_shape.py +1 -1
emx_onnx_cgen/lowering/conv.py +1 -1
emx_onnx_cgen/lowering/conv_transpose.py +1 -1
emx_onnx_cgen/lowering/cumsum.py +1 -1
emx_onnx_cgen/lowering/depth_space.py +1 -1
emx_onnx_cgen/lowering/dropout.py +1 -1
emx_onnx_cgen/lowering/einsum.py +1 -1
emx_onnx_cgen/lowering/elementwise.py +152 -4
emx_onnx_cgen/lowering/expand.py +1 -1
emx_onnx_cgen/lowering/eye_like.py +1 -1
emx_onnx_cgen/lowering/flatten.py +1 -1
emx_onnx_cgen/lowering/gather.py +1 -1
emx_onnx_cgen/lowering/gather_elements.py +1 -1
emx_onnx_cgen/lowering/gather_nd.py +1 -1
emx_onnx_cgen/lowering/gemm.py +1 -1
emx_onnx_cgen/lowering/global_max_pool.py +1 -1
emx_onnx_cgen/lowering/grid_sample.py +1 -1
emx_onnx_cgen/lowering/group_normalization.py +1 -1
emx_onnx_cgen/lowering/hardmax.py +1 -1
emx_onnx_cgen/lowering/identity.py +1 -1
emx_onnx_cgen/lowering/instance_normalization.py +1 -1
emx_onnx_cgen/lowering/layer_normalization.py +1 -1
emx_onnx_cgen/lowering/logsoftmax.py +1 -1
emx_onnx_cgen/lowering/lp_normalization.py +1 -1
emx_onnx_cgen/lowering/lp_pool.py +1 -1
emx_onnx_cgen/lowering/lrn.py +1 -1
emx_onnx_cgen/lowering/lstm.py +1 -1
emx_onnx_cgen/lowering/matmul.py +1 -1
emx_onnx_cgen/lowering/maxpool.py +1 -1
emx_onnx_cgen/lowering/mean_variance_normalization.py +1 -1
emx_onnx_cgen/lowering/negative_log_likelihood_loss.py +1 -1
emx_onnx_cgen/lowering/non_max_suppression.py +157 -0
emx_onnx_cgen/lowering/nonzero.py +1 -1
emx_onnx_cgen/lowering/one_hot.py +1 -1
emx_onnx_cgen/lowering/pad.py +1 -1
emx_onnx_cgen/lowering/qlinear_matmul.py +212 -0
emx_onnx_cgen/lowering/quantize_linear.py +1 -1
emx_onnx_cgen/lowering/range.py +1 -1
emx_onnx_cgen/lowering/reduce.py +1 -1
emx_onnx_cgen/lowering/registry.py +24 -5
emx_onnx_cgen/lowering/reshape.py +1 -1
emx_onnx_cgen/lowering/resize.py +1 -1
emx_onnx_cgen/lowering/rms_normalization.py +1 -1
emx_onnx_cgen/lowering/rotary_embedding.py +165 -0
emx_onnx_cgen/lowering/scatter_nd.py +1 -1
emx_onnx_cgen/lowering/shape.py +6 -25
emx_onnx_cgen/lowering/size.py +1 -1
emx_onnx_cgen/lowering/slice.py +1 -1
emx_onnx_cgen/lowering/softmax.py +1 -1
emx_onnx_cgen/lowering/softmax_cross_entropy_loss.py +1 -1
emx_onnx_cgen/lowering/split.py +1 -1
emx_onnx_cgen/lowering/squeeze.py +1 -1
emx_onnx_cgen/lowering/tensor_scatter.py +110 -0
emx_onnx_cgen/lowering/tile.py +1 -1
emx_onnx_cgen/lowering/topk.py +25 -7
emx_onnx_cgen/lowering/transpose.py +1 -1
emx_onnx_cgen/lowering/trilu.py +1 -1
emx_onnx_cgen/lowering/unsqueeze.py +1 -1
emx_onnx_cgen/lowering/variadic.py +1 -1
emx_onnx_cgen/lowering/where.py +1 -1
emx_onnx_cgen/runtime/evaluator.py +325 -1
emx_onnx_cgen/verification.py +9 -39
{emx_onnx_cgen-0.3.0.dist-info → emx_onnx_cgen-0.3.2.dist-info}/METADATA +8 -7
emx_onnx_cgen-0.3.2.dist-info/RECORD +107 -0
{emx_onnx_cgen-0.3.0.dist-info → emx_onnx_cgen-0.3.2.dist-info}/WHEEL +1 -1
shared/scalar_functions.py +11 -0
shared/ulp.py +17 -0
emx_onnx_cgen-0.3.0.dist-info/RECORD +0 -93
{emx_onnx_cgen-0.3.0.dist-info → emx_onnx_cgen-0.3.2.dist-info}/entry_points.txt +0 -0
{emx_onnx_cgen-0.3.0.dist-info → emx_onnx_cgen-0.3.2.dist-info}/top_level.txt +0 -0

emx_onnx_cgen/_build_info.py CHANGED Viewed

@@ -1,3 +1,3 @@
 """Auto-generated by build backend. Do not edit."""
-BUILD_DATE = '2026-01-20T17:39:52Z'
+BUILD_DATE = '2026-01-23T03:11:42Z'
 GIT_VERSION = 'unknown'

emx_onnx_cgen/_version.py CHANGED Viewed

@@ -28,7 +28,7 @@ version_tuple: VERSION_TUPLE
 commit_id: COMMIT_ID
 __commit_id__: COMMIT_ID
-__version__ = version = '0.3.0'
-__version_tuple__ = version_tuple = (0, 3, 0)
+__version__ = version = '0.3.2'
+__version_tuple__ = version_tuple = (0, 3, 2)
 __commit_id__ = commit_id = None

emx_onnx_cgen/cli.py CHANGED Viewed

@@ -178,10 +178,10 @@ def _build_parser() -> argparse.ArgumentParser:
     compile_parser.add_argument(
         "--large-weight-threshold",
         type=int,
-        default=1024,
+        default=1024 * 1024,
         help=(
             "Store weights larger than this element count in a binary file "
-            "(default: 1024)"
+            "(default: 1048576; set to 0 to disable)"
         ),
     )
     add_restrict_flags(compile_parser)
@@ -251,6 +251,15 @@ def _build_parser() -> argparse.ArgumentParser:
         default=100,
         help="Maximum allowed ULP difference for floating outputs (default: 100)",
     )
+    verify_parser.add_argument(
+        "--runtime",
+        choices=("onnxruntime", "onnx-reference"),
+        default="onnx-reference",
+        help=(
+            "Runtime backend for verification (default: onnx-reference; "
+            "options: onnxruntime, onnx-reference)"
+        ),
+    )
     add_restrict_flags(verify_parser)
     return parser
@@ -361,9 +370,6 @@ def _resolve_compiler(cc: str | None, prefer_ccache: bool = False) -> list[str]
 def _handle_verify(args: argparse.Namespace) -> int:
-    import numpy as np
-    import onnxruntime as ort
     success_message, error, _operators = _verify_model(
         args, include_build_details=True
     )
@@ -381,7 +387,6 @@ def _verify_model(
     include_build_details: bool,
 ) -> tuple[str | None, str | None, list[str]]:
     import numpy as np
-    import onnxruntime as ort
     def log_step(step: str, started_at: float) -> None:
         duration = time.perf_counter() - started_at
@@ -511,31 +516,44 @@ def _verify_model(
             )
             for name, value in payload["inputs"].items()
         }
+    runtime_name = args.runtime
+    runtime_started = time.perf_counter()
     try:
-        ort_started = time.perf_counter()
-        sess_options = make_deterministic_session_options(ort)
-        sess = ort.InferenceSession(
-            model.SerializeToString(),
-            sess_options=sess_options,
-            providers=["CPUExecutionProvider"],
-        )
-        ort_outputs = sess.run(None, inputs)
+        if runtime_name == "onnxruntime":
+            import onnxruntime as ort
+            sess_options = make_deterministic_session_options(ort)
+            sess = ort.InferenceSession(
+                model.SerializeToString(),
+                sess_options=sess_options,
+                providers=["CPUExecutionProvider"],
+            )
+            runtime_outputs = sess.run(None, inputs)
+        else:
+            from onnx.reference import ReferenceEvaluator
+            evaluator = ReferenceEvaluator(model)
+            runtime_outputs = evaluator.run(None, inputs)
     except Exception as exc:
-        log_step("onnx runtime", ort_started)
+        log_step(runtime_name, runtime_started)
         message = str(exc)
-        if "NOT_IMPLEMENTED" in message:
+        if runtime_name == "onnxruntime" and "NOT_IMPLEMENTED" in message:
             LOGGER.warning(
                 "Skipping verification for %s: ONNX Runtime does not support the model (%s)",
                 model_path,
                 message,
             )
             return "", None, operators
-        return None, f"ONNX Runtime failed to run {model_path}: {message}", operators
-    log_step("onnx runtime", ort_started)
+        return (
+            None,
+            f"{runtime_name} failed to run {model_path}: {message}",
+            operators,
+        )
+    log_step(runtime_name, runtime_started)
     payload_outputs = payload.get("outputs", {})
     max_ulp = 0
     try:
-        for value, ort_out in zip(graph.outputs, ort_outputs):
+        for value, runtime_out in zip(graph.outputs, runtime_outputs):
             output_payload = payload_outputs.get(value.name)
             if output_payload is None:
                 raise AssertionError(f"Missing output {value.name} in testbench data")
@@ -543,12 +561,12 @@ def _verify_model(
             output_data = decode_testbench_array(
                 output_payload["data"], info.np_dtype
             ).astype(info.np_dtype, copy=False)
-            ort_out = ort_out.astype(info.np_dtype, copy=False)
-            output_data = output_data.reshape(ort_out.shape)
+            runtime_out = runtime_out.astype(info.np_dtype, copy=False)
+            output_data = output_data.reshape(runtime_out.shape)
             if np.issubdtype(info.np_dtype, np.floating):
-                max_ulp = max(max_ulp, max_ulp_diff(output_data, ort_out))
+                max_ulp = max(max_ulp, max_ulp_diff(output_data, runtime_out))
             else:
-                np.testing.assert_array_equal(output_data, ort_out)
+                np.testing.assert_array_equal(output_data, runtime_out)
     except AssertionError as exc:
         return None, str(exc), operators
     if max_ulp > args.max_ulp:
@@ -574,6 +592,15 @@ def _load_test_data_inputs(
             "Test data input count does not match model inputs: "
             f"{len(input_files)} vs {len(model.graph.input)}."
         )
+    for value_info in model.graph.input:
+        value_kind = value_info.type.WhichOneof("value")
+        if value_kind != "tensor_type":
+            LOGGER.warning(
+                "Skipping test data load for non-tensor input %s (type %s).",
+                value_info.name,
+                value_kind or "unknown",
+            )
+            return None
     inputs: dict[str, np.ndarray] = {}
     for index, path in enumerate(input_files):
         tensor = onnx.TensorProto()

emx_onnx_cgen/codegen/__init__.py CHANGED Viewed

@@ -7,6 +7,7 @@ from .c_emitter import (
     GemmOp,
     LoweredModel,
     MatMulOp,
+    QLinearMatMulOp,
     ShapeOp,
     UnaryOp,
 )
@@ -20,6 +21,7 @@ __all__ = [
     "GemmOp",
     "LoweredModel",
     "MatMulOp",
+    "QLinearMatMulOp",
     "ShapeOp",
     "UnaryOp",
 ]

emx-onnx-cgen 0.3.0__py3-none-any.whl → 0.3.2__py3-none-any.whl

emx-onnx-cgen 0.3.0__py3-none-any.whl → 0.3.2__py3-none-any.whl