PyPI - tico - Versions diffs - 0.1.0.dev250411__py3-none-any.whl - Mend

tico 0.1.0.dev250411__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (196) hide show

tico/__init__.py +31 -0
tico/config/__init__.py +4 -0
tico/config/base.py +37 -0
tico/config/factory.py +41 -0
tico/config/v1.py +35 -0
tico/experimental/__init__.py +1 -0
tico/experimental/quantization/__init__.py +1 -0
tico/experimental/quantization/algorithm/__init__.py +1 -0
tico/experimental/quantization/algorithm/gptq/__init__.py +1 -0
tico/experimental/quantization/algorithm/gptq/gptq.py +172 -0
tico/experimental/quantization/algorithm/gptq/quant.py +153 -0
tico/experimental/quantization/algorithm/gptq/quantizer.py +225 -0
tico/experimental/quantization/algorithm/gptq/utils.py +65 -0
tico/experimental/quantization/algorithm/pt2e/__init__.py +1 -0
tico/experimental/quantization/algorithm/pt2e/annotation/__init__.py +1 -0
tico/experimental/quantization/algorithm/pt2e/annotation/annotator.py +215 -0
tico/experimental/quantization/algorithm/pt2e/annotation/config.py +26 -0
tico/experimental/quantization/algorithm/pt2e/annotation/op/__init__.py +21 -0
tico/experimental/quantization/algorithm/pt2e/annotation/op/adaptive_avg_pool2d.py +65 -0
tico/experimental/quantization/algorithm/pt2e/annotation/op/add.py +57 -0
tico/experimental/quantization/algorithm/pt2e/annotation/op/conv2d.py +92 -0
tico/experimental/quantization/algorithm/pt2e/annotation/op/div.py +57 -0
tico/experimental/quantization/algorithm/pt2e/annotation/op/linear.py +94 -0
tico/experimental/quantization/algorithm/pt2e/annotation/op/mean.py +53 -0
tico/experimental/quantization/algorithm/pt2e/annotation/op/mul.py +57 -0
tico/experimental/quantization/algorithm/pt2e/annotation/op/relu6.py +53 -0
tico/experimental/quantization/algorithm/pt2e/annotation/op/rsqrt.py +53 -0
tico/experimental/quantization/algorithm/pt2e/annotation/op/sub.py +57 -0
tico/experimental/quantization/algorithm/pt2e/annotation/spec.py +47 -0
tico/experimental/quantization/algorithm/pt2e/annotation/utils.py +88 -0
tico/experimental/quantization/algorithm/pt2e/quantizer.py +78 -0
tico/experimental/quantization/algorithm/pt2e/transformation/__init__.py +1 -0
tico/experimental/quantization/algorithm/pt2e/transformation/convert_scalars_to_attrs.py +58 -0
tico/experimental/quantization/algorithm/pt2e/utils.py +138 -0
tico/experimental/quantization/algorithm/smoothquant/__init__.py +1 -0
tico/experimental/quantization/algorithm/smoothquant/observer.py +78 -0
tico/experimental/quantization/algorithm/smoothquant/quantizer.py +81 -0
tico/experimental/quantization/algorithm/smoothquant/smooth_quant.py +164 -0
tico/experimental/quantization/config.py +68 -0
tico/experimental/quantization/evaluation/__init__.py +1 -0
tico/experimental/quantization/evaluation/backend.py +20 -0
tico/experimental/quantization/evaluation/evaluate.py +223 -0
tico/experimental/quantization/evaluation/executor/__init__.py +1 -0
tico/experimental/quantization/evaluation/executor/backend_executor.py +54 -0
tico/experimental/quantization/evaluation/executor/circle_executor.py +75 -0
tico/experimental/quantization/evaluation/executor/triv24_executor.py +128 -0
tico/experimental/quantization/evaluation/metric.py +109 -0
tico/experimental/quantization/evaluation/utils.py +185 -0
tico/experimental/quantization/passes/__init__.py +1 -0
tico/experimental/quantization/passes/fold_quant_ops.py +97 -0
tico/experimental/quantization/passes/insert_quantize_on_dtype_mismatch.py +289 -0
tico/experimental/quantization/passes/propagate_qparam_backward.py +91 -0
tico/experimental/quantization/passes/propagate_qparam_forward.py +141 -0
tico/experimental/quantization/passes/remove_weight_dequant_op.py +168 -0
tico/experimental/quantization/public_interface.py +108 -0
tico/experimental/quantization/quantizer.py +71 -0
tico/interpreter/__init__.py +1 -0
tico/interpreter/infer.py +116 -0
tico/interpreter/interpreter.py +93 -0
tico/passes/__init__.py +1 -0
tico/passes/cast_aten_where_arg_type.py +185 -0
tico/passes/cast_mixed_type_args.py +186 -0
tico/passes/const_prop_pass.py +307 -0
tico/passes/convert_conv1d_to_conv2d.py +151 -0
tico/passes/convert_layout_op_to_reshape.py +84 -0
tico/passes/convert_repeat_to_expand_copy.py +90 -0
tico/passes/convert_to_relu6.py +180 -0
tico/passes/decompose_addmm.py +127 -0
tico/passes/decompose_batch_norm.py +198 -0
tico/passes/decompose_fake_quantize.py +126 -0
tico/passes/decompose_fake_quantize_tensor_qparams.py +270 -0
tico/passes/decompose_group_norm.py +258 -0
tico/passes/decompose_grouped_conv2d.py +202 -0
tico/passes/decompose_slice_scatter.py +167 -0
tico/passes/extract_dtype_kwargs.py +121 -0
tico/passes/fill_meta_val.py +57 -0
tico/passes/fuse_redundant_reshape_to_mean.py +102 -0
tico/passes/legalize_causal_mask_value.py +113 -0
tico/passes/legalize_predefined_layout_operators.py +383 -0
tico/passes/lower_pow2_to_mul.py +75 -0
tico/passes/lower_to_resize_nearest_neighbor.py +249 -0
tico/passes/lower_to_slice.py +112 -0
tico/passes/merge_consecutive_cat.py +82 -0
tico/passes/ops.py +75 -0
tico/passes/remove_nop.py +85 -0
tico/passes/remove_redundant_assert_nodes.py +50 -0
tico/passes/remove_redundant_expand.py +70 -0
tico/passes/remove_redundant_permute.py +102 -0
tico/passes/remove_redundant_reshape.py +431 -0
tico/passes/remove_redundant_slice.py +64 -0
tico/passes/remove_redundant_to_copy.py +84 -0
tico/passes/restore_linear.py +113 -0
tico/passes/segment_index_select.py +143 -0
tico/pt2_to_circle.py +101 -0
tico/serialize/__init__.py +1 -0
tico/serialize/circle_graph.py +264 -0
tico/serialize/circle_mapping.py +177 -0
tico/serialize/circle_serializer.py +232 -0
tico/serialize/operators/__init__.py +28 -0
tico/serialize/operators/hashable_opcode.py +43 -0
tico/serialize/operators/node_visitor.py +80 -0
tico/serialize/operators/op_add.py +69 -0
tico/serialize/operators/op_alias_copy.py +64 -0
tico/serialize/operators/op_any.py +142 -0
tico/serialize/operators/op_arange_start_step.py +61 -0
tico/serialize/operators/op_argmax.py +62 -0
tico/serialize/operators/op_avg_pool2d.py +112 -0
tico/serialize/operators/op_bmm.py +62 -0
tico/serialize/operators/op_cat.py +66 -0
tico/serialize/operators/op_clamp.py +123 -0
tico/serialize/operators/op_clone.py +71 -0
tico/serialize/operators/op_constant_pad_nd.py +72 -0
tico/serialize/operators/op_conv2d.py +181 -0
tico/serialize/operators/op_copy.py +162 -0
tico/serialize/operators/op_cos.py +59 -0
tico/serialize/operators/op_cumsum.py +92 -0
tico/serialize/operators/op_depthwise_conv2d.py +198 -0
tico/serialize/operators/op_dequantize_per_channel.py +82 -0
tico/serialize/operators/op_dequantize_per_tensor.py +64 -0
tico/serialize/operators/op_div.py +62 -0
tico/serialize/operators/op_embedding.py +60 -0
tico/serialize/operators/op_eq.py +64 -0
tico/serialize/operators/op_exp.py +60 -0
tico/serialize/operators/op_expand.py +91 -0
tico/serialize/operators/op_full.py +48 -0
tico/serialize/operators/op_full_like.py +55 -0
tico/serialize/operators/op_ge.py +54 -0
tico/serialize/operators/op_gelu.py +59 -0
tico/serialize/operators/op_gt.py +54 -0
tico/serialize/operators/op_index.py +82 -0
tico/serialize/operators/op_index_select.py +64 -0
tico/serialize/operators/op_instance_norm.py +91 -0
tico/serialize/operators/op_linear.py +70 -0
tico/serialize/operators/op_log.py +53 -0
tico/serialize/operators/op_log1p.py +83 -0
tico/serialize/operators/op_logical_and.py +63 -0
tico/serialize/operators/op_logical_not.py +62 -0
tico/serialize/operators/op_lt.py +61 -0
tico/serialize/operators/op_max_pool2d_with_indices.py +140 -0
tico/serialize/operators/op_maximum.py +53 -0
tico/serialize/operators/op_mean.py +66 -0
tico/serialize/operators/op_minimum.py +53 -0
tico/serialize/operators/op_mm.py +174 -0
tico/serialize/operators/op_mul.py +99 -0
tico/serialize/operators/op_ne.py +54 -0
tico/serialize/operators/op_neg.py +59 -0
tico/serialize/operators/op_permute.py +65 -0
tico/serialize/operators/op_pow.py +138 -0
tico/serialize/operators/op_prelu.py +54 -0
tico/serialize/operators/op_quantize_per_tensor.py +79 -0
tico/serialize/operators/op_reciprocal.py +64 -0
tico/serialize/operators/op_relu.py +53 -0
tico/serialize/operators/op_relu6.py +52 -0
tico/serialize/operators/op_repeat.py +99 -0
tico/serialize/operators/op_reshape.py +73 -0
tico/serialize/operators/op_resize_nearest_neighbor.py +70 -0
tico/serialize/operators/op_rsqrt.py +53 -0
tico/serialize/operators/op_scalar_tensor.py +51 -0
tico/serialize/operators/op_select_copy.py +65 -0
tico/serialize/operators/op_sigmoid.py +56 -0
tico/serialize/operators/op_sin.py +53 -0
tico/serialize/operators/op_slice.py +155 -0
tico/serialize/operators/op_softmax.py +100 -0
tico/serialize/operators/op_split_with_sizes.py +96 -0
tico/serialize/operators/op_sqrt.py +55 -0
tico/serialize/operators/op_squeeze.py +73 -0
tico/serialize/operators/op_sub.py +71 -0
tico/serialize/operators/op_sum.py +63 -0
tico/serialize/operators/op_tanh.py +54 -0
tico/serialize/operators/op_to_copy.py +105 -0
tico/serialize/operators/op_unsqueeze.py +66 -0
tico/serialize/operators/op_view.py +74 -0
tico/serialize/operators/op_where.py +82 -0
tico/serialize/operators/utils.py +51 -0
tico/serialize/pack.py +35 -0
tico/serialize/quant_param.py +42 -0
tico/utils/__init__.py +1 -0
tico/utils/convert.py +292 -0
tico/utils/define.py +35 -0
tico/utils/diff_graph.py +181 -0
tico/utils/errors.py +35 -0
tico/utils/graph.py +200 -0
tico/utils/logging.py +45 -0
tico/utils/model.py +37 -0
tico/utils/padding.py +47 -0
tico/utils/passes.py +76 -0
tico/utils/register_custom_op.py +562 -0
tico/utils/trace_decorators.py +101 -0
tico/utils/utils.py +314 -0
tico/utils/validate_args_kwargs.py +1114 -0
tico-0.1.0.dev250411.dist-info/LICENSE +241 -0
tico-0.1.0.dev250411.dist-info/METADATA +17 -0
tico-0.1.0.dev250411.dist-info/RECORD +196 -0
tico-0.1.0.dev250411.dist-info/WHEEL +5 -0
tico-0.1.0.dev250411.dist-info/entry_points.txt +3 -0
tico-0.1.0.dev250411.dist-info/top_level.txt +1 -0

tico/serialize/operators/op_cos.py ADDED Viewed

@@ -0,0 +1,59 @@
+# Copyright (c) 2025 Samsung Electronics Co., Ltd. All Rights Reserved
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from typing import Dict, List, TYPE_CHECKING
+if TYPE_CHECKING:
+    import torch._ops
+    import torch.fx
+import torch
+from circle_schema import circle
+from tico.serialize.circle_graph import CircleSubgraph
+from tico.serialize.operators.hashable_opcode import OpCode
+from tico.serialize.operators.node_visitor import NodeVisitor, register_node_visitor
+from tico.serialize.operators.utils import create_builtin_operator, get_op_index
+from tico.utils.validate_args_kwargs import CosArgs
+@register_node_visitor
+class CosVisitor(NodeVisitor):
+    target: List[torch._ops.OpOverload] = [torch.ops.aten.cos.default]
+    def __init__(self, op_codes: Dict[OpCode, int], graph: CircleSubgraph):
+        super().__init__(op_codes, graph)
+    def define_node(
+        self,
+        node: torch.fx.Node,
+    ) -> circle.Operator.OperatorT:
+        args = CosArgs(*node.args, **node.kwargs)  # type: ignore[arg-type]
+        input = args.input
+        op_index = get_op_index(
+            circle.BuiltinOperator.BuiltinOperator.COS, self._op_codes
+        )
+        inputs = [input]
+        outputs = [node]
+        operator = create_builtin_operator(self.graph, op_index, inputs, outputs)
+        # Op-specific option
+        operator.builtinOptionsType = circle.BuiltinOptions.BuiltinOptions.CosOptions
+        option = circle.CosOptions.CosOptionsT()
+        operator.builtinOptions = option
+        return operator

tico/serialize/operators/op_cumsum.py ADDED Viewed

@@ -0,0 +1,92 @@
+# Copyright (c) 2025 Samsung Electronics Co., Ltd. All Rights Reserved
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from typing import Dict, List, TYPE_CHECKING
+if TYPE_CHECKING:
+    import torch._ops
+    import torch.fx
+import torch
+from circle_schema import circle
+from tico.serialize.circle_graph import CircleSubgraph
+from tico.serialize.circle_mapping import (
+    circle_legalize_dtype_to,
+    extract_torch_dtype,
+    to_circle_dtype,
+)
+from tico.serialize.operators.hashable_opcode import OpCode
+from tico.serialize.operators.node_visitor import NodeVisitor, register_node_visitor
+from tico.serialize.operators.utils import create_builtin_operator, get_op_index
+from tico.utils.validate_args_kwargs import CumsumArgs
+@register_node_visitor
+class CumsumVisitor(NodeVisitor):
+    target: List[torch._ops.OpOverload] = [torch.ops.aten.cumsum.default]
+    def __init__(self, op_codes: Dict[OpCode, int], graph: CircleSubgraph):
+        super().__init__(op_codes, graph)
+    def define_node(
+        self,
+        node: torch.fx.Node,
+    ) -> circle.Operator.OperatorT:
+        args = CumsumArgs(*node.args, **node.kwargs)  # type: ignore[arg-type]
+        input = args.input
+        dim = args.dim
+        dim_i32 = circle_legalize_dtype_to(dim, dtype=torch.int32)
+        casted_input: torch.fx.Node | circle.Tensor.TensorT = input
+        # torch.cumsum doesn't follow input dtype when input dtype is int32.
+        # Since circle-interpreter needs a model to have same dtype between input and output,
+        #   let's cast the input to torch.int64.
+        input_dtype = extract_torch_dtype(input)
+        if input_dtype == torch.int32:
+            input_tensor: circle.Tensor.TensorT = self.graph.get_tensor(input)
+            input_shape: List[int] = input_tensor.shape
+            cast_op_index = get_op_index(
+                circle.BuiltinOperator.BuiltinOperator.CAST, self._op_codes
+            )
+            cast_name = f"{input.name}_cast"
+            cast_dtype = circle.TensorType.TensorType.INT64
+            cast_tensor = self.graph.add_tensor_from_scratch(
+                prefix=cast_name, dtype=cast_dtype, shape=input_shape
+            )
+            cast_operator = create_builtin_operator(
+                self.graph, cast_op_index, [input], [cast_tensor]
+            )
+            cast_operator.builtinOptionsType = (
+                circle.BuiltinOptions.BuiltinOptions.CastOptions
+            )
+            cast_option = circle.CastOptions.CastOptionsT()
+            cast_option.inDataType = to_circle_dtype(input_dtype)
+            cast_option.outDataType = cast_dtype
+            cast_operator.builtinOptions = cast_option
+            self.graph.add_operator(cast_operator)
+            casted_input = cast_tensor
+        inputs = [casted_input, dim_i32]
+        outputs = [node]
+        op_index = get_op_index(
+            circle.BuiltinOperator.BuiltinOperator.CUMSUM, self._op_codes
+        )
+        operator = create_builtin_operator(self.graph, op_index, inputs, outputs)
+        operator.builtinOptionsType = circle.BuiltinOptions.BuiltinOptions.CumsumOptions
+        option = circle.CumsumOptions.CumsumOptionsT()
+        operator.builtinOptions = option
+        return operator

tico/serialize/operators/op_depthwise_conv2d.py ADDED Viewed

@@ -0,0 +1,198 @@
+# Copyright (c) 2025 Samsung Electronics Co., Ltd. All Rights Reserved
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from typing import Dict, List, TYPE_CHECKING
+if TYPE_CHECKING:
+    import torch._ops
+    import torch.fx
+import torch
+from circle_schema import circle
+from tico.serialize.circle_mapping import extract_circle_dtype, extract_shape
+from tico.serialize.operators.hashable_opcode import OpCode
+from tico.serialize.operators.node_visitor import NodeVisitor, register_node_visitor
+from tico.serialize.operators.utils import create_builtin_operator, get_op_index
+from tico.utils.define import define_pad_node
+from tico.utils.padding import is_same_padding, is_valid_padding, SAME, VALID
+from tico.utils.validate_args_kwargs import Conv2DArgs
+@register_node_visitor
+class DepthwiseConv2dVisitor(NodeVisitor):
+    """
+    NOTE
+    - The padding of DepthwiseCircleConv2D has only padding type('VALID', 'SAME') in circle, but the padding of nn.Conv2d has padding type(('valid', 'same')), padding value(int)
+    and padding value(tuple->[pad_h, pad_w]).
+    ref: https://tensorflow.org/api_docs/python/tf/nn/depthwise_conv2d
+    [1] With valid/same padding: DepthwiseCircleConv2D (only)
+        [ATEN IR]
+        Input[NHWC] ---- circle_cumstom.depthwise_conv2d[NHWC] ---- OUTPUT[NHWC]
+        Weight[NHWC] ---/
+        Bias ----------/
+        [CIRCLE IR]
+        Input[NHWC] ----  DepthwiseCircleConv2D[NHWC] ---- OUTPUT[NHWC]
+        Weight[NHWC] ---/
+        Bias ----------/
+    [2] With additional padding: CirclePad + DepthwiseCircleConv2D
+        [ATEN IR]
+        Input[NHWC] ---- circle_cumstom.depthwise_conv2d[NHWC] ---- OUTPUT[NHWC]
+        Weight[NHWC] ---/
+        Bias ----------/
+        [CIRCLE IR]
+        Input[NHWC] ---- CirclePad[NHWC] ---- DepthwiseCircleConv2D[NHWC] ---- OUTPUT[NHWC]
+                         Weight[NHWC] ------/
+                         Bias -------------/
+    """
+    target: List[torch._ops.OpOverload] = [
+        torch.ops.circle_custom.depthwise_conv2d,
+        torch.ops.circle_custom.depthwise_conv2d.padding,
+    ]
+    def __init__(self, op_codes: Dict[OpCode, int], graph):
+        super().__init__(op_codes, graph)
+    def define_dconv_node(
+        self,
+        padding: int,
+        stride: List[int],
+        dilation: List[int],
+        depthMultiplier: int,
+        inputs: List,
+        outputs: List,
+    ) -> circle.Operator.OperatorT:
+        def set_conv2d_option(operator, stride, dilation):
+            operator.builtinOptionsType = (
+                circle.BuiltinOptions.BuiltinOptions.DepthwiseConv2DOptions
+            )
+            option = circle.DepthwiseConv2DOptions.DepthwiseConv2DOptionsT()
+            option.padding = padding
+            option.strideH = stride[0]
+            option.strideW = stride[1]
+            option.depthMultiplier = depthMultiplier
+            option.dilationHFactor = dilation[0]
+            option.dilationWFactor = dilation[1]
+            option.fusedActivationFunction = (
+                circle.ActivationFunctionType.ActivationFunctionType.NONE
+            )
+            operator.builtinOptions = option
+        conv2d_op_index = get_op_index(
+            circle.BuiltinOperator.BuiltinOperator.DEPTHWISE_CONV_2D, self._op_codes
+        )
+        operator = create_builtin_operator(self.graph, conv2d_op_index, inputs, outputs)
+        set_conv2d_option(operator, stride, dilation)
+        return operator
+    def define_node(self, node: torch.fx.Node) -> circle.Operator.OperatorT:
+        # Let's get Conv2dArgs because torch Conv2D with group == input_channel maps to CircleDepthwiseConv2D
+        args = Conv2DArgs(*node.args, **node.kwargs)  # type: ignore[arg-type]
+        input_ = args.input
+        weight = args.weight
+        bias = args.bias
+        stride = args.stride
+        padding = args.padding
+        dilation = args.dilation
+        groups = args.groups
+        input_dtype: int = extract_circle_dtype(input_)
+        input_shape = list(extract_shape(input_))  # OHWI
+        assert len(input_shape) == 4, len(input_shape)
+        output_shape = list(extract_shape(node))  # OHWI
+        assert len(output_shape) == 4, len(output_shape)
+        weight_shape = list(extract_shape(weight))  # 1HWO
+        assert (
+            weight_shape[3] % groups == 0
+        ), "Depthwise convolution requires output channel to be divisible by groups"
+        assert weight_shape[0] == 1
+        assert weight_shape[3] == output_shape[3]
+        assert input_shape[3] == groups
+        depthMultiplier = weight_shape[3] // input_shape[3]
+        assert weight_shape[3] % input_shape[3] == 0, "depthMultiplier must be integer"
+        conv_input: torch.fx.node.Node | circle.Tensor.TensorT = input_
+        if is_valid_padding(padding):
+            dconv2d_padding_type = VALID
+        elif is_same_padding(padding, input_shape, output_shape):
+            dconv2d_padding_type = SAME
+        else:
+            assert isinstance(padding, list) and len(padding) == 2
+            dconv2d_padding_type = VALID
+            # Padding is not valid or same, so we use valid padding and add padding operator before conv2d operator.
+            # when data_format is "NHWC", padding should be [[0, 0], [pad_top, pad_bottom], [pad_left, pad_right], [0, 0]]
+            paddings = torch.tensor(
+                [
+                    [0, 0],
+                    [padding[0], padding[0]],
+                    [padding[1], padding[1]],
+                    [0, 0],
+                ],
+                dtype=torch.int32,
+            )
+            pad_output_shape = [
+                input_shape[0],
+                input_shape[1],
+                input_shape[2],
+                input_shape[3],
+            ]
+            # Add (pad_top+pad_bottom) to pad_output_shape_h
+            pad_output_shape[1] += padding[0] * 2
+            # Add (pad_left+pad_Right) to pad_output_shape_w
+            pad_output_shape[2] += padding[1] * 2
+            # create padded output tensor
+            pad_output = self.graph.add_tensor_from_scratch(
+                prefix=f"{node.name}_input_pad_output",
+                shape=pad_output_shape,
+                dtype=input_dtype,
+            )
+            # CirclePad
+            pad_operator = define_pad_node(
+                self.graph, self._op_codes, [input_, paddings], [pad_output]
+            )
+            self.graph.add_operator(pad_operator)
+            conv_input = pad_output
+        if bias is None:
+            # luci-interpreter can't run no bias conv. Let's add zero vector for bias.
+            assert len(weight_shape) == 4
+            out_channel = weight_shape[3]
+            bias = [0.0] * out_channel  # type: ignore[assignment]
+        # DConv2D
+        dconv2d_operator = self.define_dconv_node(
+            dconv2d_padding_type,
+            stride,
+            dilation,
+            depthMultiplier,
+            [conv_input, weight, bias],
+            [node],
+        )
+        return dconv2d_operator

tico/serialize/operators/op_dequantize_per_channel.py ADDED Viewed

@@ -0,0 +1,82 @@
+# Copyright (c) 2025 Samsung Electronics Co., Ltd. All Rights Reserved
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from typing import Dict, List, TYPE_CHECKING
+if TYPE_CHECKING:
+    import torch._ops
+    import torch.fx
+import numpy as np
+import torch
+from circle_schema import circle
+from tico.serialize.circle_graph import CircleSubgraph
+from tico.serialize.operators.hashable_opcode import OpCode
+from tico.serialize.operators.node_visitor import NodeVisitor, register_node_visitor
+from tico.serialize.operators.utils import create_builtin_operator, get_op_index
+from tico.utils.validate_args_kwargs import DequantizePerChannelArgs
+@register_node_visitor
+class DequantizePerChannelDefaultVisitor(NodeVisitor):
+    target: List[torch._ops.OpOverload] = [
+        torch.ops.quantized_decomposed.dequantize_per_channel.default
+    ]
+    def __init__(self, op_codes: Dict[OpCode, int], graph: CircleSubgraph):
+        super().__init__(op_codes, graph)
+    def define_node(
+        self,
+        node: torch.fx.Node,
+    ) -> circle.Operator.OperatorT:
+        args = DequantizePerChannelArgs(*node.args, **node.kwargs)  # type: ignore[arg-type]
+        input = args.input
+        scales = args.scales
+        zero_points = args.zero_points
+        axis = args.axis
+        quant_min = args.quant_min
+        quant_max = args.quant_max
+        output_tensor: circle.Tensor.TensorT = self.graph.get_tensor(node)
+        assert not output_tensor.quantization
+        quant_param = circle.QuantizationParameters.QuantizationParametersT()
+        quant_param.min = [quant_min]
+        quant_param.max = [quant_max]
+        # Retrieve scale
+        scale_buf = bytes(self.graph.get_buffer(scales).data)
+        quant_param.scale = np.frombuffer(scale_buf, dtype=np.float32).tolist()  # type: ignore[assignment]
+        # Retrieve zp
+        zp_buf = bytes(self.graph.get_buffer(zero_points).data)
+        quant_param.zeroPoint = np.frombuffer(zp_buf, dtype=np.int32).tolist()  # type: ignore[assignment]
+        quant_param.quantizedDimension = axis
+        output_tensor.quantization = quant_param
+        inputs = [input]
+        outputs = [node]
+        op_index = get_op_index(
+            circle.BuiltinOperator.BuiltinOperator.DEQUANTIZE, self._op_codes
+        )
+        operator = create_builtin_operator(self.graph, op_index, inputs, outputs)
+        # Op-specific option
+        operator.builtinOptionsType = (
+            circle.BuiltinOptions.BuiltinOptions.DequantizeOptions
+        )
+        option = circle.DequantizeOptions.DequantizeOptionsT()
+        operator.builtinOptions = option
+        return operator

tico/serialize/operators/op_dequantize_per_tensor.py ADDED Viewed

@@ -0,0 +1,64 @@
+# Copyright (c) 2025 Samsung Electronics Co., Ltd. All Rights Reserved
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from typing import Dict, List, TYPE_CHECKING
+if TYPE_CHECKING:
+    import torch._ops
+    import torch.fx
+import torch
+from circle_schema import circle
+from tico.serialize.circle_graph import CircleSubgraph
+from tico.serialize.operators.hashable_opcode import OpCode
+from tico.serialize.operators.node_visitor import NodeVisitor, register_node_visitor
+from tico.serialize.operators.utils import create_builtin_operator, get_op_index
+from tico.utils.validate_args_kwargs import DequantizePerTensorArgs
+@register_node_visitor
+class DequantizePerTensorDefaultVisitor(NodeVisitor):
+    target: List[torch._ops.OpOverload] = [
+        torch.ops.quantized_decomposed.dequantize_per_tensor.default
+    ]
+    def __init__(self, op_codes: Dict[OpCode, int], graph: CircleSubgraph):
+        super().__init__(op_codes, graph)
+    def define_node(
+        self,
+        node: torch.fx.Node,
+    ) -> circle.Operator.OperatorT:
+        args = DequantizePerTensorArgs(*node.args, **node.kwargs)  # type: ignore[arg-type]
+        input = args.input
+        input_tensor: circle.Tensor.TensorT = self.graph.get_tensor(input)
+        assert input_tensor.quantization
+        inputs = [input]
+        outputs = [node]
+        op_index = get_op_index(
+            circle.BuiltinOperator.BuiltinOperator.DEQUANTIZE, self._op_codes
+        )
+        operator = create_builtin_operator(self.graph, op_index, inputs, outputs)
+        # Op-specific option
+        operator.builtinOptionsType = (
+            circle.BuiltinOptions.BuiltinOptions.DequantizeOptions
+        )
+        option = circle.DequantizeOptions.DequantizeOptionsT()
+        operator.builtinOptions = option
+        return operator

tico/serialize/operators/op_div.py ADDED Viewed

@@ -0,0 +1,62 @@
+# Copyright (c) 2025 Samsung Electronics Co., Ltd. All Rights Reserved
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from typing import Dict, List, TYPE_CHECKING
+if TYPE_CHECKING:
+    import torch._ops
+    import torch.fx
+import torch
+from circle_schema import circle
+from tico.serialize.circle_graph import CircleSubgraph
+from tico.serialize.operators.hashable_opcode import OpCode
+from tico.serialize.operators.node_visitor import NodeVisitor, register_node_visitor
+from tico.serialize.operators.utils import create_builtin_operator, get_op_index
+from tico.utils.validate_args_kwargs import DivTensorArgs
+@register_node_visitor
+class DivVisitor(NodeVisitor):
+    target: List[torch._ops.OpOverload] = [torch.ops.aten.div.Tensor]
+    def __init__(self, op_codes: Dict[OpCode, int], graph: CircleSubgraph):
+        super().__init__(op_codes, graph)
+    def define_node(
+        self,
+        node: torch.fx.Node,
+    ) -> circle.Operator.OperatorT:
+        args = DivTensorArgs(*node.args, **node.kwargs)  # type: ignore[arg-type]
+        input = args.input
+        other = args.other
+        op_index = get_op_index(
+            circle.BuiltinOperator.BuiltinOperator.DIV, self._op_codes
+        )
+        inputs = [input, other]
+        outputs = [node]
+        operator = create_builtin_operator(self.graph, op_index, inputs, outputs)
+        # Op-specific option
+        operator.builtinOptionsType = circle.BuiltinOptions.BuiltinOptions.DivOptions
+        option = circle.DivOptions.DivOptionsT()
+        option.fusedActivationFunction = (
+            circle.ActivationFunctionType.ActivationFunctionType.NONE
+        )
+        operator.builtinOptions = option
+        return operator

tico/serialize/operators/op_embedding.py ADDED Viewed

@@ -0,0 +1,60 @@
+# Copyright (c) 2025 Samsung Electronics Co., Ltd. All Rights Reserved
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from typing import Dict, List, TYPE_CHECKING
+if TYPE_CHECKING:
+    import torch._ops
+    import torch.fx
+import torch
+from circle_schema import circle
+from tico.serialize.operators.hashable_opcode import OpCode
+from tico.serialize.operators.node_visitor import NodeVisitor, register_node_visitor
+from tico.serialize.operators.utils import create_builtin_operator, get_op_index
+from tico.utils.validate_args_kwargs import EmbeddingArgs
+@register_node_visitor
+class EmbeddingVisitor(NodeVisitor):
+    target: List[torch._ops.OpOverload] = [torch.ops.aten.embedding.default]
+    def __init__(self, op_codes: Dict[OpCode, int], graph):
+        super().__init__(op_codes, graph)
+    def define_node(
+        self,
+        node: torch.fx.Node,
+    ) -> circle.Operator.OperatorT:
+        op_index = get_op_index(
+            circle.BuiltinOperator.BuiltinOperator.GATHER, self._op_codes
+        )
+        args = EmbeddingArgs(*node.args, **node.kwargs)  # type: ignore[arg-type]
+        # do not need to handle optional parameters, since all options are related to Embedding Table values.
+        embedding_table = args.weight
+        index_tensor = args.indices
+        inputs = [embedding_table, index_tensor]
+        outputs = [node]
+        operator = create_builtin_operator(self.graph, op_index, inputs, outputs)
+        # Op-specific option
+        operator.builtinOptionsType = circle.BuiltinOptions.BuiltinOptions.GatherOptions
+        option = circle.GatherOptions.GatherOptionsT()
+        option.axis = 0
+        operator.builtinOptions = option
+        # Op-specific option does not exists for Embedding.
+        return operator

tico/serialize/operators/op_eq.py ADDED Viewed

@@ -0,0 +1,64 @@
+# Copyright (c) 2025 Samsung Electronics Co., Ltd. All Rights Reserved
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from typing import Dict, List, TYPE_CHECKING
+if TYPE_CHECKING:
+    import torch._ops
+    import torch.fx
+import torch
+from circle_schema import circle
+from tico.serialize.circle_graph import CircleSubgraph
+from tico.serialize.operators.hashable_opcode import OpCode
+from tico.serialize.operators.node_visitor import NodeVisitor, register_node_visitor
+from tico.serialize.operators.utils import create_builtin_operator, get_op_index
+from tico.utils.validate_args_kwargs import EqArgs
+@register_node_visitor
+class EqVisitor(NodeVisitor):
+    target: List[torch._ops.OpOverload] = [
+        torch.ops.aten.eq.Scalar,
+        torch.ops.aten.eq.Tensor,
+    ]
+    def __init__(self, op_codes: Dict[OpCode, int], graph: CircleSubgraph):
+        super().__init__(op_codes, graph)
+    def define_node(
+        self,
+        node: torch.fx.Node,
+    ) -> circle.Operator.OperatorT:
+        args = EqArgs(*node.args, **node.kwargs)  # type: ignore[arg-type]
+        input = args.input
+        other = args.other
+        op_index = get_op_index(
+            circle.BuiltinOperator.BuiltinOperator.EQUAL,
+            self._op_codes,
+        )
+        inputs = [input, other]
+        outputs = [node]
+        operator = create_builtin_operator(self.graph, op_index, inputs, outputs)
+        # Op-specific option
+        operator.builtinOptionsType = circle.BuiltinOptions.BuiltinOptions.EqualOptions
+        option = circle.EqualOptions.EqualOptionsT()
+        operator.builtinOptions = option
+        return operator