PyPI - tico - Versions diffs - 0.1.0.dev250411__py3-none-any.whl - Mend

tico 0.1.0.dev250411__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (196) hide show

tico/__init__.py +31 -0
tico/config/__init__.py +4 -0
tico/config/base.py +37 -0
tico/config/factory.py +41 -0
tico/config/v1.py +35 -0
tico/experimental/__init__.py +1 -0
tico/experimental/quantization/__init__.py +1 -0
tico/experimental/quantization/algorithm/__init__.py +1 -0
tico/experimental/quantization/algorithm/gptq/__init__.py +1 -0
tico/experimental/quantization/algorithm/gptq/gptq.py +172 -0
tico/experimental/quantization/algorithm/gptq/quant.py +153 -0
tico/experimental/quantization/algorithm/gptq/quantizer.py +225 -0
tico/experimental/quantization/algorithm/gptq/utils.py +65 -0
tico/experimental/quantization/algorithm/pt2e/__init__.py +1 -0
tico/experimental/quantization/algorithm/pt2e/annotation/__init__.py +1 -0
tico/experimental/quantization/algorithm/pt2e/annotation/annotator.py +215 -0
tico/experimental/quantization/algorithm/pt2e/annotation/config.py +26 -0
tico/experimental/quantization/algorithm/pt2e/annotation/op/__init__.py +21 -0
tico/experimental/quantization/algorithm/pt2e/annotation/op/adaptive_avg_pool2d.py +65 -0
tico/experimental/quantization/algorithm/pt2e/annotation/op/add.py +57 -0
tico/experimental/quantization/algorithm/pt2e/annotation/op/conv2d.py +92 -0
tico/experimental/quantization/algorithm/pt2e/annotation/op/div.py +57 -0
tico/experimental/quantization/algorithm/pt2e/annotation/op/linear.py +94 -0
tico/experimental/quantization/algorithm/pt2e/annotation/op/mean.py +53 -0
tico/experimental/quantization/algorithm/pt2e/annotation/op/mul.py +57 -0
tico/experimental/quantization/algorithm/pt2e/annotation/op/relu6.py +53 -0
tico/experimental/quantization/algorithm/pt2e/annotation/op/rsqrt.py +53 -0
tico/experimental/quantization/algorithm/pt2e/annotation/op/sub.py +57 -0
tico/experimental/quantization/algorithm/pt2e/annotation/spec.py +47 -0
tico/experimental/quantization/algorithm/pt2e/annotation/utils.py +88 -0
tico/experimental/quantization/algorithm/pt2e/quantizer.py +78 -0
tico/experimental/quantization/algorithm/pt2e/transformation/__init__.py +1 -0
tico/experimental/quantization/algorithm/pt2e/transformation/convert_scalars_to_attrs.py +58 -0
tico/experimental/quantization/algorithm/pt2e/utils.py +138 -0
tico/experimental/quantization/algorithm/smoothquant/__init__.py +1 -0
tico/experimental/quantization/algorithm/smoothquant/observer.py +78 -0
tico/experimental/quantization/algorithm/smoothquant/quantizer.py +81 -0
tico/experimental/quantization/algorithm/smoothquant/smooth_quant.py +164 -0
tico/experimental/quantization/config.py +68 -0
tico/experimental/quantization/evaluation/__init__.py +1 -0
tico/experimental/quantization/evaluation/backend.py +20 -0
tico/experimental/quantization/evaluation/evaluate.py +223 -0
tico/experimental/quantization/evaluation/executor/__init__.py +1 -0
tico/experimental/quantization/evaluation/executor/backend_executor.py +54 -0
tico/experimental/quantization/evaluation/executor/circle_executor.py +75 -0
tico/experimental/quantization/evaluation/executor/triv24_executor.py +128 -0
tico/experimental/quantization/evaluation/metric.py +109 -0
tico/experimental/quantization/evaluation/utils.py +185 -0
tico/experimental/quantization/passes/__init__.py +1 -0
tico/experimental/quantization/passes/fold_quant_ops.py +97 -0
tico/experimental/quantization/passes/insert_quantize_on_dtype_mismatch.py +289 -0
tico/experimental/quantization/passes/propagate_qparam_backward.py +91 -0
tico/experimental/quantization/passes/propagate_qparam_forward.py +141 -0
tico/experimental/quantization/passes/remove_weight_dequant_op.py +168 -0
tico/experimental/quantization/public_interface.py +108 -0
tico/experimental/quantization/quantizer.py +71 -0
tico/interpreter/__init__.py +1 -0
tico/interpreter/infer.py +116 -0
tico/interpreter/interpreter.py +93 -0
tico/passes/__init__.py +1 -0
tico/passes/cast_aten_where_arg_type.py +185 -0
tico/passes/cast_mixed_type_args.py +186 -0
tico/passes/const_prop_pass.py +307 -0
tico/passes/convert_conv1d_to_conv2d.py +151 -0
tico/passes/convert_layout_op_to_reshape.py +84 -0
tico/passes/convert_repeat_to_expand_copy.py +90 -0
tico/passes/convert_to_relu6.py +180 -0
tico/passes/decompose_addmm.py +127 -0
tico/passes/decompose_batch_norm.py +198 -0
tico/passes/decompose_fake_quantize.py +126 -0
tico/passes/decompose_fake_quantize_tensor_qparams.py +270 -0
tico/passes/decompose_group_norm.py +258 -0
tico/passes/decompose_grouped_conv2d.py +202 -0
tico/passes/decompose_slice_scatter.py +167 -0
tico/passes/extract_dtype_kwargs.py +121 -0
tico/passes/fill_meta_val.py +57 -0
tico/passes/fuse_redundant_reshape_to_mean.py +102 -0
tico/passes/legalize_causal_mask_value.py +113 -0
tico/passes/legalize_predefined_layout_operators.py +383 -0
tico/passes/lower_pow2_to_mul.py +75 -0
tico/passes/lower_to_resize_nearest_neighbor.py +249 -0
tico/passes/lower_to_slice.py +112 -0
tico/passes/merge_consecutive_cat.py +82 -0
tico/passes/ops.py +75 -0
tico/passes/remove_nop.py +85 -0
tico/passes/remove_redundant_assert_nodes.py +50 -0
tico/passes/remove_redundant_expand.py +70 -0
tico/passes/remove_redundant_permute.py +102 -0
tico/passes/remove_redundant_reshape.py +431 -0
tico/passes/remove_redundant_slice.py +64 -0
tico/passes/remove_redundant_to_copy.py +84 -0
tico/passes/restore_linear.py +113 -0
tico/passes/segment_index_select.py +143 -0
tico/pt2_to_circle.py +101 -0
tico/serialize/__init__.py +1 -0
tico/serialize/circle_graph.py +264 -0
tico/serialize/circle_mapping.py +177 -0
tico/serialize/circle_serializer.py +232 -0
tico/serialize/operators/__init__.py +28 -0
tico/serialize/operators/hashable_opcode.py +43 -0
tico/serialize/operators/node_visitor.py +80 -0
tico/serialize/operators/op_add.py +69 -0
tico/serialize/operators/op_alias_copy.py +64 -0
tico/serialize/operators/op_any.py +142 -0
tico/serialize/operators/op_arange_start_step.py +61 -0
tico/serialize/operators/op_argmax.py +62 -0
tico/serialize/operators/op_avg_pool2d.py +112 -0
tico/serialize/operators/op_bmm.py +62 -0
tico/serialize/operators/op_cat.py +66 -0
tico/serialize/operators/op_clamp.py +123 -0
tico/serialize/operators/op_clone.py +71 -0
tico/serialize/operators/op_constant_pad_nd.py +72 -0
tico/serialize/operators/op_conv2d.py +181 -0
tico/serialize/operators/op_copy.py +162 -0
tico/serialize/operators/op_cos.py +59 -0
tico/serialize/operators/op_cumsum.py +92 -0
tico/serialize/operators/op_depthwise_conv2d.py +198 -0
tico/serialize/operators/op_dequantize_per_channel.py +82 -0
tico/serialize/operators/op_dequantize_per_tensor.py +64 -0
tico/serialize/operators/op_div.py +62 -0
tico/serialize/operators/op_embedding.py +60 -0
tico/serialize/operators/op_eq.py +64 -0
tico/serialize/operators/op_exp.py +60 -0
tico/serialize/operators/op_expand.py +91 -0
tico/serialize/operators/op_full.py +48 -0
tico/serialize/operators/op_full_like.py +55 -0
tico/serialize/operators/op_ge.py +54 -0
tico/serialize/operators/op_gelu.py +59 -0
tico/serialize/operators/op_gt.py +54 -0
tico/serialize/operators/op_index.py +82 -0
tico/serialize/operators/op_index_select.py +64 -0
tico/serialize/operators/op_instance_norm.py +91 -0
tico/serialize/operators/op_linear.py +70 -0
tico/serialize/operators/op_log.py +53 -0
tico/serialize/operators/op_log1p.py +83 -0
tico/serialize/operators/op_logical_and.py +63 -0
tico/serialize/operators/op_logical_not.py +62 -0
tico/serialize/operators/op_lt.py +61 -0
tico/serialize/operators/op_max_pool2d_with_indices.py +140 -0
tico/serialize/operators/op_maximum.py +53 -0
tico/serialize/operators/op_mean.py +66 -0
tico/serialize/operators/op_minimum.py +53 -0
tico/serialize/operators/op_mm.py +174 -0
tico/serialize/operators/op_mul.py +99 -0
tico/serialize/operators/op_ne.py +54 -0
tico/serialize/operators/op_neg.py +59 -0
tico/serialize/operators/op_permute.py +65 -0
tico/serialize/operators/op_pow.py +138 -0
tico/serialize/operators/op_prelu.py +54 -0
tico/serialize/operators/op_quantize_per_tensor.py +79 -0
tico/serialize/operators/op_reciprocal.py +64 -0
tico/serialize/operators/op_relu.py +53 -0
tico/serialize/operators/op_relu6.py +52 -0
tico/serialize/operators/op_repeat.py +99 -0
tico/serialize/operators/op_reshape.py +73 -0
tico/serialize/operators/op_resize_nearest_neighbor.py +70 -0
tico/serialize/operators/op_rsqrt.py +53 -0
tico/serialize/operators/op_scalar_tensor.py +51 -0
tico/serialize/operators/op_select_copy.py +65 -0
tico/serialize/operators/op_sigmoid.py +56 -0
tico/serialize/operators/op_sin.py +53 -0
tico/serialize/operators/op_slice.py +155 -0
tico/serialize/operators/op_softmax.py +100 -0
tico/serialize/operators/op_split_with_sizes.py +96 -0
tico/serialize/operators/op_sqrt.py +55 -0
tico/serialize/operators/op_squeeze.py +73 -0
tico/serialize/operators/op_sub.py +71 -0
tico/serialize/operators/op_sum.py +63 -0
tico/serialize/operators/op_tanh.py +54 -0
tico/serialize/operators/op_to_copy.py +105 -0
tico/serialize/operators/op_unsqueeze.py +66 -0
tico/serialize/operators/op_view.py +74 -0
tico/serialize/operators/op_where.py +82 -0
tico/serialize/operators/utils.py +51 -0
tico/serialize/pack.py +35 -0
tico/serialize/quant_param.py +42 -0
tico/utils/__init__.py +1 -0
tico/utils/convert.py +292 -0
tico/utils/define.py +35 -0
tico/utils/diff_graph.py +181 -0
tico/utils/errors.py +35 -0
tico/utils/graph.py +200 -0
tico/utils/logging.py +45 -0
tico/utils/model.py +37 -0
tico/utils/padding.py +47 -0
tico/utils/passes.py +76 -0
tico/utils/register_custom_op.py +562 -0
tico/utils/trace_decorators.py +101 -0
tico/utils/utils.py +314 -0
tico/utils/validate_args_kwargs.py +1114 -0
tico-0.1.0.dev250411.dist-info/LICENSE +241 -0
tico-0.1.0.dev250411.dist-info/METADATA +17 -0
tico-0.1.0.dev250411.dist-info/RECORD +196 -0
tico-0.1.0.dev250411.dist-info/WHEEL +5 -0
tico-0.1.0.dev250411.dist-info/entry_points.txt +3 -0
tico-0.1.0.dev250411.dist-info/top_level.txt +1 -0

tico/serialize/operators/op_minimum.py ADDED Viewed

@@ -0,0 +1,53 @@
+# Copyright (c) 2025 Samsung Electronics Co., Ltd. All Rights Reserved
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from typing import Dict, List, TYPE_CHECKING
+if TYPE_CHECKING:
+    import torch._ops
+    import torch.fx
+import torch
+from circle_schema import circle
+from tico.serialize.circle_graph import CircleSubgraph
+from tico.serialize.operators.hashable_opcode import OpCode
+from tico.serialize.operators.node_visitor import NodeVisitor, register_node_visitor
+from tico.serialize.operators.utils import create_builtin_operator, get_op_index
+from tico.utils.validate_args_kwargs import MinimumArgs
+@register_node_visitor
+class MinimumVisitor(NodeVisitor):
+    target: List[torch._ops.OpOverload] = [
+        torch.ops.aten.minimum.default,
+    ]
+    def __init__(self, op_codes: Dict[OpCode, int], graph: CircleSubgraph):
+        super().__init__(op_codes, graph)
+    def define_node(self, node: torch.fx.Node) -> circle.Operator.OperatorT:
+        args = MinimumArgs(*node.args, **node.kwargs)  # type: ignore[arg-type]
+        input = args.input
+        other = args.other
+        op_index = get_op_index(
+            circle.BuiltinOperator.BuiltinOperator.MINIMUM, self._op_codes
+        )
+        inputs = [input, other]
+        outputs = [node]
+        operator = create_builtin_operator(self.graph, op_index, inputs, outputs)
+        return operator

tico/serialize/operators/op_mm.py ADDED Viewed

@@ -0,0 +1,174 @@
+# Copyright (c) 2025 Samsung Electronics Co., Ltd. All Rights Reserved
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from typing import Dict, List, TYPE_CHECKING
+if TYPE_CHECKING:
+    import torch._ops
+    import torch.fx
+import torch
+from circle_schema import circle
+from tico.serialize.circle_graph import CircleSubgraph, is_const
+from tico.serialize.operators.hashable_opcode import OpCode
+from tico.serialize.operators.node_visitor import NodeVisitor, register_node_visitor
+from tico.serialize.operators.utils import create_builtin_operator, get_op_index
+from tico.utils.validate_args_kwargs import MatmulArgs
+@register_node_visitor
+class MatmulDefaultVisitor(NodeVisitor):
+    """
+    Convert matmul to equavalent BatchMatMul or FullyConnected with Transpose.
+    """
+    target: List[torch._ops.OpOverload] = [torch.ops.aten.mm.default]
+    def __init__(self, op_codes: Dict[OpCode, int], graph: CircleSubgraph):
+        super().__init__(op_codes, graph)
+    # NOTE: Matmul is equivalent to Batch MatMul (batch=1)
+    def define_bmm_node(self, inputs, outputs) -> circle.Operator.OperatorT:
+        def set_bmm_option(operator):
+            operator.builtinOptionsType = (
+                circle.BuiltinOptions.BuiltinOptions.BatchMatMulOptions
+            )
+            option = circle.BatchMatMulOptions.BatchMatMulOptionsT()
+            option.adjointLhs, option.adjointRhs = False, False
+            option.asymmetricQuantizeInputs = False
+            operator.builtinOptions = option
+        op_index = get_op_index(
+            circle.BuiltinOperator.BuiltinOperator.BATCH_MATMUL, self._op_codes
+        )
+        operator = create_builtin_operator(self.graph, op_index, inputs, outputs)
+        set_bmm_option(operator)
+        return operator
+    def define_transpose_node(self, inputs, outputs) -> circle.Operator.OperatorT:
+        def set_transpose_option(operator):
+            operator.builtinOptionsType = (
+                circle.BuiltinOptions.BuiltinOptions.TransposeOptions
+            )
+            option = circle.TransposeOptions.TransposeOptionsT()
+            operator.builtinOptions = option
+        transpose_op_index = get_op_index(
+            circle.BuiltinOperator.BuiltinOperator.TRANSPOSE, self._op_codes
+        )
+        operator = create_builtin_operator(
+            self.graph, transpose_op_index, inputs, outputs
+        )
+        set_transpose_option(operator)
+        return operator
+    def define_fc_node(self, inputs, outputs) -> circle.Operator.OperatorT:
+        def set_fc_option(operator):
+            operator.builtinOptionsType = (
+                circle.BuiltinOptions.BuiltinOptions.FullyConnectedOptions
+            )
+            option = circle.FullyConnectedOptions.FullyConnectedOptionsT()
+            option.fusedActivationFunction = (
+                circle.ActivationFunctionType.ActivationFunctionType.NONE
+            )
+            option.weightsFormat = (
+                circle.FullyConnectedOptionsWeightsFormat.FullyConnectedOptionsWeightsFormat.DEFAULT
+            )
+            option.keepNumDims = False
+            option.asymmetricQuantizeInputs = False
+            option.quantizedBiasType = circle.TensorType.TensorType.FLOAT32
+            operator.builtinOptions = option
+        fc_op_index = get_op_index(
+            circle.BuiltinOperator.BuiltinOperator.FULLY_CONNECTED, self._op_codes
+        )
+        operator = create_builtin_operator(self.graph, fc_op_index, inputs, outputs)
+        set_fc_option(operator)
+        return operator
+    """
+    Define FullyConnnected with Tranpose operator.
+    Note that those sets of operators are equivalent.
+    (1) Matmul
+    matmul( lhs[H, K], rhs[K, W'] ) -> output(H, W')
+    (2) Transpose + FullyConneccted
+    transpose( rhs[K, W'] ) -> trs_output[W', K]
+    fullyconnected( lhs[H, K], trs_output[W', K] ) -> output(H, W')
+    """
+    def define_fc_with_transpose(self, inputs, outputs) -> circle.Operator.OperatorT:
+        lhs, rhs = inputs
+        # get transpose shape
+        rhs_tid: int = self.graph.get_tid_registered(rhs)
+        rhs_tensor: circle.Tensor.TensorT = self.graph.tensors[rhs_tid]
+        rhs_name: str = rhs.name
+        rhs_type: int = rhs_tensor.type
+        rhs_shape: List[int] = rhs_tensor.shape
+        assert len(rhs_shape) == 2, len(rhs_shape)
+        rhs_shape_transpose = [rhs_shape[1], rhs_shape[0]]
+        # create transpose output tensor
+        trs_output = self.graph.add_tensor_from_scratch(
+            prefix=f"{rhs_name}_transposed_output",
+            shape=rhs_shape_transpose,
+            dtype=rhs_type,
+        )
+        trs_perm = self.graph.add_const_tensor(data=[1, 0])
+        trs_operator = self.define_transpose_node([rhs, trs_perm], [trs_output])
+        self.graph.add_operator(trs_operator)
+        # define fc node
+        fc_input = lhs
+        fc_weight = trs_output
+        fc_shape = [fc_weight.shape[0]]
+        fc_bias = self.graph.add_const_tensor(
+            data=[0.0] * fc_shape[0],
+        )
+        operator = self.define_fc_node([fc_input, fc_weight, fc_bias], outputs)
+        return operator
+    def define_node(
+        self, node: torch.fx.Node, prior_latency=True
+    ) -> circle.Operator.OperatorT:
+        """
+        NOTE: Possibility of accuracy-latency trade-off
+        From ONE compiler's perspective:
+        - BMM uses per-tensor quantization for both rhs and lhs.
+        - FC uses per-channel quantization for weight and per-tensor for input.
+        Thus, FC is better in terms of accuracy.
+        FC necessarily involves an additional transpose operation to be identical with mm.
+        If transposed operand is const, it can be optimized by constant folding.
+        Thus, convert FC only if tranpose can be folded.
+        TODO set prior_latency outside
+        """
+        args = MatmulArgs(*node.args, **node.kwargs)  # type: ignore[arg-type]
+        input = args.input
+        other = args.other
+        inputs = [input, other]
+        outputs = [node]
+        if not is_const(other) and prior_latency:
+            operator = self.define_bmm_node(inputs, outputs)
+        else:
+            operator = self.define_fc_with_transpose(inputs, outputs)
+        return operator

tico/serialize/operators/op_mul.py ADDED Viewed

@@ -0,0 +1,99 @@
+# Copyright (c) 2025 Samsung Electronics Co., Ltd. All Rights Reserved
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from typing import Dict, List, TYPE_CHECKING
+if TYPE_CHECKING:
+    import torch._ops
+    import torch.fx
+import torch
+from circle_schema import circle
+from tico.serialize.circle_graph import CircleSubgraph
+from tico.serialize.operators.hashable_opcode import OpCode
+from tico.serialize.operators.node_visitor import NodeVisitor, register_node_visitor
+from tico.serialize.operators.utils import create_builtin_operator, get_op_index
+from tico.utils.validate_args_kwargs import MulScalarArgs, MulTensorArgs
+class BaseMulVisitor(NodeVisitor):
+    def __init__(self, op_codes: Dict[OpCode, int], graph: CircleSubgraph):
+        super().__init__(op_codes, graph)
+    def define_node(
+        self,
+        node: torch.fx.node.Node,
+    ) -> circle.Operator.OperatorT:
+        op_index = get_op_index(
+            circle.BuiltinOperator.BuiltinOperator.MUL, self._op_codes
+        )
+        inputs = list(node.args)
+        outputs = [node]
+        operator = create_builtin_operator(self.graph, op_index, inputs, outputs)
+        # Op-specific option
+        operator.builtinOptionsType = circle.BuiltinOptions.BuiltinOptions.MulOptions
+        option = circle.MulOptions.MulOptionsT()
+        option.fusedActivationFunction = (
+            circle.ActivationFunctionType.ActivationFunctionType.NONE
+        )
+        operator.builtinOptions = option
+        return operator
+@register_node_visitor
+class MulTensorVisitor(BaseMulVisitor):
+    target: List[torch._ops.OpOverload] = [torch.ops.aten.mul.Tensor]
+    def __init__(self, op_codes: Dict[OpCode, int], graph: CircleSubgraph):
+        super().__init__(op_codes, graph)
+    def define_node(
+        self,
+        node: torch.fx.Node,
+    ) -> circle.Operator.OperatorT:
+        args = MulTensorArgs(*node.args, **node.kwargs)  # type: ignore[arg-type]
+        input = args.input
+        other = args.other
+        operator = super().define_node(
+            node,
+        )
+        return operator
+@register_node_visitor
+class MulScalarVisitor(BaseMulVisitor):
+    target: List[torch._ops.OpOverload] = [torch.ops.aten.mul.Scalar]
+    def __init__(self, op_codes: Dict[OpCode, int], graph: CircleSubgraph):
+        super().__init__(op_codes, graph)
+    def define_node(
+        self,
+        node: torch.fx.Node,
+    ) -> circle.Operator.OperatorT:
+        args = MulScalarArgs(*node.args, **node.kwargs)  # type: ignore[arg-type]
+        input = args.input
+        other = args.other
+        operator = super().define_node(
+            node,
+        )
+        return operator

tico/serialize/operators/op_ne.py ADDED Viewed

@@ -0,0 +1,54 @@
+# Copyright (c) 2025 Samsung Electronics Co., Ltd. All Rights Reserved
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from typing import Dict, List, TYPE_CHECKING
+if TYPE_CHECKING:
+    import torch._ops
+    import torch.fx
+import torch
+from circle_schema import circle
+from tico.serialize.circle_graph import CircleSubgraph
+from tico.serialize.operators.hashable_opcode import OpCode
+from tico.serialize.operators.node_visitor import NodeVisitor, register_node_visitor
+from tico.serialize.operators.utils import create_builtin_operator, get_op_index
+from tico.utils.validate_args_kwargs import NeTensorArgs
+@register_node_visitor
+class NeVisitor(NodeVisitor):
+    target: List[torch._ops.OpOverload] = [
+        torch.ops.aten.ne.Scalar,
+        torch.ops.aten.ne.Tensor,
+    ]
+    def __init__(self, op_codes: Dict[OpCode, int], graph: CircleSubgraph):
+        super().__init__(op_codes, graph)
+    def define_node(self, node: torch.fx.Node) -> circle.Operator.OperatorT:
+        op_index = get_op_index(
+            circle.BuiltinOperator.BuiltinOperator.NOT_EQUAL, self._op_codes
+        )
+        args = NeTensorArgs(*node.args, **node.kwargs)  # type: ignore[arg-type]
+        input = args.input
+        other = args.other
+        inputs = [input, other]
+        outputs = [node]
+        operator = create_builtin_operator(self.graph, op_index, inputs, outputs)
+        return operator

tico/serialize/operators/op_neg.py ADDED Viewed

@@ -0,0 +1,59 @@
+# Copyright (c) 2025 Samsung Electronics Co., Ltd. All Rights Reserved
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from typing import Dict, List, TYPE_CHECKING
+if TYPE_CHECKING:
+    import torch._ops
+    import torch.fx
+import torch
+from circle_schema import circle
+from tico.serialize.circle_graph import CircleSubgraph
+from tico.serialize.operators.hashable_opcode import OpCode
+from tico.serialize.operators.node_visitor import NodeVisitor, register_node_visitor
+from tico.serialize.operators.utils import create_builtin_operator, get_op_index
+from tico.utils.validate_args_kwargs import NegArgs
+@register_node_visitor
+class NegVisitor(NodeVisitor):
+    target: List[torch._ops.OpOverload] = [torch.ops.aten.neg.default]
+    def __init__(self, op_codes: Dict[OpCode, int], graph: CircleSubgraph):
+        super().__init__(op_codes, graph)
+    def define_node(
+        self,
+        node: torch.fx.Node,
+    ) -> circle.Operator.OperatorT:
+        op_index = get_op_index(
+            circle.BuiltinOperator.BuiltinOperator.NEG,
+            self._op_codes,
+        )
+        args = NegArgs(*node.args, **node.kwargs)  # type: ignore[arg-type]
+        input = args.input
+        inputs = [input]
+        outputs = [node]
+        operator = create_builtin_operator(self.graph, op_index, inputs, outputs)
+        # Op-specific option
+        operator.builtinOptionsType = circle.BuiltinOptions.BuiltinOptions.NegOptions
+        option = circle.NegOptions.NegOptionsT()
+        operator.builtinOptions = option
+        return operator

tico/serialize/operators/op_permute.py ADDED Viewed

@@ -0,0 +1,65 @@
+# Copyright (c) 2025 Samsung Electronics Co., Ltd. All Rights Reserved
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from typing import Dict, List, TYPE_CHECKING
+if TYPE_CHECKING:
+    import torch._ops
+    import torch.fx
+import torch
+from circle_schema import circle
+from tico.serialize.circle_graph import CircleSubgraph
+from tico.serialize.circle_mapping import circle_legalize_dtype_to
+from tico.serialize.operators.hashable_opcode import OpCode
+from tico.serialize.operators.node_visitor import NodeVisitor, register_node_visitor
+from tico.serialize.operators.utils import create_builtin_operator, get_op_index
+from tico.utils.validate_args_kwargs import PermuteArgs
+@register_node_visitor
+class PermuteVisitor(NodeVisitor):
+    target: List[torch._ops.OpOverload] = [torch.ops.aten.permute.default]
+    def __init__(self, op_codes: Dict[OpCode, int], graph: CircleSubgraph):
+        super().__init__(op_codes, graph)
+    def define_node(
+        self,
+        node: torch.fx.Node,
+    ) -> circle.Operator.OperatorT:
+        op_index = get_op_index(
+            circle.BuiltinOperator.BuiltinOperator.TRANSPOSE,
+            self._op_codes,
+        )
+        args = PermuteArgs(*node.args, **node.kwargs)  # type: ignore[arg-type]
+        input = args.input
+        dims = args.dims
+        dims_i32 = circle_legalize_dtype_to(dims, dtype=torch.int32)
+        inputs = [input, dims_i32]
+        outputs = [node]
+        operator = create_builtin_operator(self.graph, op_index, inputs, outputs)
+        # Op-specific option
+        operator.builtinOptionsType = (
+            circle.BuiltinOptions.BuiltinOptions.TransposeOptions
+        )
+        option = circle.TransposeOptions.TransposeOptionsT()
+        operator.builtinOptions = option
+        return operator

tico/serialize/operators/op_pow.py ADDED Viewed

@@ -0,0 +1,138 @@
+# Copyright (c) 2025 Samsung Electronics Co., Ltd. All Rights Reserved
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from typing import Dict, List, TYPE_CHECKING
+if TYPE_CHECKING:
+    import torch._ops
+    import torch.fx
+import torch
+from circle_schema import circle
+from tico.serialize.circle_graph import CircleSubgraph
+from tico.serialize.circle_mapping import extract_torch_dtype, to_circle_dtype
+from tico.serialize.operators.hashable_opcode import OpCode
+from tico.serialize.operators.node_visitor import NodeVisitor, register_node_visitor
+from tico.serialize.operators.utils import create_builtin_operator, get_op_index
+from tico.utils.validate_args_kwargs import PowTensorScalarArgs, PowTensorTensorArgs
+class BasePowVisitor(NodeVisitor):
+    def __init__(self, op_codes: Dict[OpCode, int], graph: CircleSubgraph):
+        super().__init__(op_codes, graph)
+    def cast_to_float(self, node: torch.fx.Node) -> circle.Tensor.TensorT:
+        assert isinstance(node, torch.fx.Node), type(node)
+        node_tensor: circle.Tensor.TensorT = self.graph.get_tensor(node)
+        node_shape: List[int] = node_tensor.shape
+        op_index = get_op_index(
+            circle.BuiltinOperator.BuiltinOperator.CAST, self._op_codes
+        )
+        cast_name = f"{node.name}_cast"
+        cast_dtype = circle.TensorType.TensorType.FLOAT32
+        cast_tensor = self.graph.add_tensor_from_scratch(
+            prefix=cast_name, dtype=cast_dtype, shape=node_shape
+        )
+        cast_operator = create_builtin_operator(
+            self.graph, op_index, [node], [cast_tensor]
+        )
+        cast_operator.builtinOptionsType = (
+            circle.BuiltinOptions.BuiltinOptions.CastOptions
+        )
+        option = circle.CastOptions.CastOptionsT()
+        node_dtype = extract_torch_dtype(node)
+        option.inDataType = to_circle_dtype(node_dtype)
+        option.outDataType = cast_dtype
+        cast_operator.builtinOptions = option
+        self.graph.add_operator(cast_operator)
+        return cast_tensor
+    def define_pow_node(self, inputs: List, outputs: List) -> circle.Operator.OperatorT:
+        op_index = get_op_index(
+            circle.BuiltinOperator.BuiltinOperator.POW, self._op_codes
+        )
+        operator = create_builtin_operator(self.graph, op_index, inputs, outputs)
+        operator.builtinOptionsType = circle.BuiltinOptions.BuiltinOptions.PowOptions
+        # Pow opearation does not have any options.
+        option = circle.PowOptions.PowOptionsT()
+        operator.builtinOptions = option
+        return operator
+# TODO Support `aten::pow.Scalar` (base=scalar, exponent=tensor)
+# ExecuTorch does not support it as of 2024/02/13.
+@register_node_visitor
+class PowTensorScalarVisitor(BasePowVisitor):
+    target: List[torch._ops.OpOverload] = [torch.ops.aten.pow.Tensor_Scalar]
+    def __init__(self, op_codes: Dict[OpCode, int], graph: CircleSubgraph):
+        super().__init__(op_codes, graph)
+    def define_node(
+        self,
+        node: torch.fx.Node,
+    ) -> circle.Operator.OperatorT:
+        args = PowTensorScalarArgs(*node.args, **node.kwargs)  # type: ignore[arg-type]
+        input = args.input
+        exponent = args.exponent
+        lhs_dtype = extract_torch_dtype(input)
+        # Circle supports only same dtype between lhs and rhs.
+        if lhs_dtype == torch.float32 and isinstance(exponent, int):
+            exponent = float(exponent)
+        if lhs_dtype == torch.int32 or lhs_dtype == torch.int64:
+            if isinstance(exponent, float):
+                input = self.cast_to_float(input)  # type: ignore[assignment]
+        operator = self.define_pow_node([input, exponent], [node])
+        return operator
+@register_node_visitor
+class PowTensorTensorVisitor(BasePowVisitor):
+    target: List[torch._ops.OpOverload] = [torch.ops.aten.pow.Tensor_Tensor]
+    def __init__(self, op_codes: Dict[OpCode, int], graph: CircleSubgraph):
+        super().__init__(op_codes, graph)
+    def define_node(
+        self,
+        node: torch.fx.Node,
+    ) -> circle.Operator.OperatorT:
+        args = PowTensorTensorArgs(*node.args, **node.kwargs)  # type: ignore[arg-type]
+        input = args.input
+        exponent = args.exponent  # type: ignore[arg-type]
+        lhs_dtype = extract_torch_dtype(input)
+        rhs_dtype = extract_torch_dtype(exponent)  # type: ignore[arg-type]
+        # Circle supports only same dtype between lhs and rhs.
+        if lhs_dtype == torch.float32 and rhs_dtype == torch.int:
+            exponent = self.cast_to_float(exponent)  # type: ignore[arg-type, assignment]
+        if lhs_dtype == torch.int32 or lhs_dtype == torch.int64:
+            if rhs_dtype == torch.float32:
+                input = self.cast_to_float(input)  # type: ignore[assignment]
+        operator = self.define_pow_node([input, exponent], [node])
+        return operator