PyPI - mct-nightly - Versions diffs - 2.4.0.20250608.655__py3-none-any.whl → 2.4.0.20250609.615__py3-none-any.whl - Mend

mct-nightly 2.4.0.20250608.655__py3-none-any.whl → 2.4.0.20250609.615__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (11) hide show

{mct_nightly-2.4.0.20250608.655.dist-info → mct_nightly-2.4.0.20250609.615.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: mct-nightly
-Version: 2.4.0.20250608.655
+Version: 2.4.0.20250609.615
 Summary: A Model Compression Toolkit for neural networks
 Author-email: ssi-dnn-dev@sony.com
 Classifier: Programming Language :: Python :: 3

{mct_nightly-2.4.0.20250608.655.dist-info → mct_nightly-2.4.0.20250609.615.dist-info}/RECORD RENAMED Viewed

@@ -1,5 +1,5 @@
-mct_nightly-2.4.0.20250608.655.dist-info/licenses/LICENSE.md,sha256=aYSSIb-5AFPeITTvXm1UAoe0uYBiMmSS8flvXaaFUks,10174
-model_compression_toolkit/__init__.py,sha256=9nm4cV4Z-_J1NtF0o6cjMqNu_GjdOWHTgWglMLmuB9Y,1557
+mct_nightly-2.4.0.20250609.615.dist-info/licenses/LICENSE.md,sha256=aYSSIb-5AFPeITTvXm1UAoe0uYBiMmSS8flvXaaFUks,10174
+model_compression_toolkit/__init__.py,sha256=iZK1iC0PgvlQ8g_69klbV_2fHfkRz-cbEc-fJLlJHQY,1557
 model_compression_toolkit/constants.py,sha256=KNgiNLpsMgSYyXMNEbHXd4bFNerQc1D6HH3vpbUq_Gs,4086
 model_compression_toolkit/defaultdict.py,sha256=LSc-sbZYXENMCw3U9F4GiXuv67IKpdn0Qm7Fr11jy-4,2277
 model_compression_toolkit/logger.py,sha256=L3q7tn3Uht0i_7phnlOWMR2Te2zvzrt2HOz9vYEInts,4529
@@ -16,7 +16,7 @@ model_compression_toolkit/core/common/framework_implementation.py,sha256=JQI_eoZ
 model_compression_toolkit/core/common/framework_info.py,sha256=5tderHT-7Cd21QrRFIJj3hH_gAcnlivOzwZ5m1ldJOs,6526
 model_compression_toolkit/core/common/memory_computation.py,sha256=ixoSpV5ZYZGyzhre3kQcvR2sNA8KBsPZ3lgbkDnw9Cs,1205
 model_compression_toolkit/core/common/model_builder_mode.py,sha256=jll9-59OPaE3ug7Y9-lLyV99_FoNHxkGZMgcm0Vkpss,1324
-model_compression_toolkit/core/common/model_collector.py,sha256=ssYLdo2FPEzXoFKQonUA3ZbrIaDp-UmLhv0mWMCHH8U,13225
+model_compression_toolkit/core/common/model_collector.py,sha256=AbnJVjDlpmQZyj3Ba0XkK76zWh5dqcDFJdKXFTq25uw,13420
 model_compression_toolkit/core/common/model_validation.py,sha256=LaG8wd6aZl0OJgieE3SeiVDEPxtk8IHq9-3wSnmWhY4,1214
 model_compression_toolkit/core/common/node_prior_info.py,sha256=WXX_PrGVG9M9I_REG5ZzFBohwmV4yf356sZnrja_FLo,2832
 model_compression_toolkit/core/common/similarity_analyzer.py,sha256=S3f6WgHyw62dGcxpX51FGKyfebe2zv9ABKbjtGyKRvY,9215
@@ -31,10 +31,10 @@ model_compression_toolkit/core/common/collectors/min_max_per_channel_collector.p
 model_compression_toolkit/core/common/collectors/statistics_collector.py,sha256=psijsQZefwjMDH8SU5E18n65HiGtQilPhKr1hhzZX-I,8268
 model_compression_toolkit/core/common/collectors/weighted_histogram_collector.py,sha256=zp3dE7YTqWmkD5QWdRhsl9zD8W6Lr96G1Wjw1g2D3T0,4894
 model_compression_toolkit/core/common/fusion/__init__.py,sha256=Rf1RcYmelmdZmBV5qOKvKWF575ofc06JFQSq83Jz99A,696
-model_compression_toolkit/core/common/fusion/fusing_info.py,sha256=uDxF0awrjn3SbcpXBpoQ4OGcKO6Z7HBk8ierZPCGbGo,21970
+model_compression_toolkit/core/common/fusion/fusing_info.py,sha256=Z-O03-DlM4XyllVg5FaQlYeIgk5UqoC8dSA6IlRODNI,22693
 model_compression_toolkit/core/common/fusion/graph_fuser.py,sha256=yxxxuwrmQ4wLW-PlTu0MEW59LmNJEh1OWy9Li15YH-8,7520
 model_compression_toolkit/core/common/graph/__init__.py,sha256=Xr-Lt_qXMdrCnnOaUS_OJP_3iTTGfPCLf8_vSrQgCs0,773
-model_compression_toolkit/core/common/graph/base_graph.py,sha256=YA0c8ucaaZu9eRO-xruLqDT3QFOpxq24ViG6ILS2jqA,41403
+model_compression_toolkit/core/common/graph/base_graph.py,sha256=NmGvxGg-UHsNEjz_mtwLhS0HMEM2-pbQPPax1QUw4o0,41378
 model_compression_toolkit/core/common/graph/base_node.py,sha256=8GEqZ8VMtVvJZuiSUVdokCq6NkFosOssetcod21DwDM,33604
 model_compression_toolkit/core/common/graph/edge.py,sha256=buoSEUZwilWBK3WeBKpJ-GeDaUA1SDdOHxDpxU_bGpk,3784
 model_compression_toolkit/core/common/graph/functional_node.py,sha256=GH5wStmw8SoAj5IdT_-ItN1Meo_P5NUTt_5bgJC4fak,3935
@@ -72,7 +72,7 @@ model_compression_toolkit/core/common/mixed_precision/mixed_precision_search_man
 model_compression_toolkit/core/common/mixed_precision/solution_refinement_procedure.py,sha256=MY8df-c_kITEr_7hOctaxhdiq29hSTA0La9Qo0oTJJY,9678
 model_compression_toolkit/core/common/mixed_precision/resource_utilization_tools/__init__.py,sha256=Rf1RcYmelmdZmBV5qOKvKWF575ofc06JFQSq83Jz99A,696
 model_compression_toolkit/core/common/mixed_precision/resource_utilization_tools/resource_utilization.py,sha256=PKkhc5q8pEPnNLXwo3U56EOCfYnPXIvPs0LlCGZOoKU,4426
-model_compression_toolkit/core/common/mixed_precision/resource_utilization_tools/resource_utilization_calculator.py,sha256=8f6KDTKD8SzVXDl9jmYJ-p19cQB0Nr_UTdCPuhELTdg,40329
+model_compression_toolkit/core/common/mixed_precision/resource_utilization_tools/resource_utilization_calculator.py,sha256=4Hl4JmrUAJjSNeT1efMTrM4UzHPr8RQeya0OY-6adWY,40304
 model_compression_toolkit/core/common/mixed_precision/resource_utilization_tools/resource_utilization_data.py,sha256=ZY5yFIDzbaqIk0UzakDBObfsVevn4fydqAfAm4RCikY,4058
 model_compression_toolkit/core/common/mixed_precision/search_methods/__init__.py,sha256=sw7LOPN1bM82o3SkMaklyH0jw-TLGK0-fl2Wq73rffI,697
 model_compression_toolkit/core/common/mixed_precision/search_methods/linear_programming.py,sha256=6Z6nQL9UH7B8dbcUR0cuCTEYFOKZAlvOb-SCk_cAZFA,6670
@@ -336,7 +336,7 @@ model_compression_toolkit/exporter/model_exporter/keras/mctq_keras_exporter.py,s
 model_compression_toolkit/exporter/model_exporter/pytorch/__init__.py,sha256=uZ2RigbY9O2PJ0Il8wPpS_s7frgg9WUGd_SHeKGyl1A,699
 model_compression_toolkit/exporter/model_exporter/pytorch/base_pytorch_exporter.py,sha256=9adOGG1nyviNzuL-1aJXyL0c_VQllSZWiG2gR-puywo,6420
 model_compression_toolkit/exporter/model_exporter/pytorch/export_serialization_format.py,sha256=bPevy6OBqng41PqytBR55e6cBEuyrUS0H8dWX4zgjQ4,967
-model_compression_toolkit/exporter/model_exporter/pytorch/fakely_quant_onnx_pytorch_exporter.py,sha256=5S3lyNVc3F62mvS8Q-RTmgQXWI6GWZ5YRvjG4qFy2MM,9520
+model_compression_toolkit/exporter/model_exporter/pytorch/fakely_quant_onnx_pytorch_exporter.py,sha256=1ix8j7rxc1giPjf2PZKwaaCb5pKo0obUvPmRtklmugY,10056
 model_compression_toolkit/exporter/model_exporter/pytorch/fakely_quant_torchscript_pytorch_exporter.py,sha256=ksWV2A-Njo-wAxQ_Ye2sLIZXBWJ_WNyjT7-qFFwvV2o,2897
 model_compression_toolkit/exporter/model_exporter/pytorch/pytorch_export_facade.py,sha256=7xuUrHPMiifn23sWfeiqR9wkYhm8EweDRL_vF-JSxMY,6642
 model_compression_toolkit/exporter/model_wrapper/__init__.py,sha256=7CF2zvpTrIEm8qnbuHnLZyTZkwBBxV24V8QA0oxGbh0,1187
@@ -529,7 +529,7 @@ model_compression_toolkit/xquant/pytorch/model_analyzer.py,sha256=b93o800yVB3Z-i
 model_compression_toolkit/xquant/pytorch/pytorch_report_utils.py,sha256=UVN_S9ULHBEldBpShCOt8-soT8YTQ5oE362y96qF_FA,3950
 model_compression_toolkit/xquant/pytorch/similarity_functions.py,sha256=CERxq5K8rqaiE-DlwhZBTUd9x69dtYJlkHOPLB54vm8,2354
 model_compression_toolkit/xquant/pytorch/tensorboard_utils.py,sha256=mkoEktLFFHtEKzzFRn_jCnxjhJolK12TZ5AQeDHzUO8,9767
-mct_nightly-2.4.0.20250608.655.dist-info/METADATA,sha256=8vPT5m8b4jAczYopmCw7AX6Zkw60YCFVYC26axUCmqA,25087
-mct_nightly-2.4.0.20250608.655.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
-mct_nightly-2.4.0.20250608.655.dist-info/top_level.txt,sha256=gsYA8juk0Z-ZmQRKULkb3JLGdOdz8jW_cMRjisn9ga4,26
-mct_nightly-2.4.0.20250608.655.dist-info/RECORD,,
+mct_nightly-2.4.0.20250609.615.dist-info/METADATA,sha256=QQwkgGOWQt_9w0Xc9uRQrcvJg370QpweeRXfkzForV0,25087
+mct_nightly-2.4.0.20250609.615.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
+mct_nightly-2.4.0.20250609.615.dist-info/top_level.txt,sha256=gsYA8juk0Z-ZmQRKULkb3JLGdOdz8jW_cMRjisn9ga4,26
+mct_nightly-2.4.0.20250609.615.dist-info/RECORD,,

model_compression_toolkit/__init__.py CHANGED Viewed

@@ -27,4 +27,4 @@ from model_compression_toolkit import data_generation
 from model_compression_toolkit import pruning
 from model_compression_toolkit.trainable_infrastructure.keras.load_model import keras_load_quantized_model
-__version__ = "2.4.0.20250608.000655"
+__version__ = "2.4.0.20250609.000615"

model_compression_toolkit/core/common/fusion/fusing_info.py CHANGED Viewed

@@ -39,13 +39,13 @@ class FusingInfo:
     - 'fusing_patterns': The patterns to generate the fused operators from.
     - 'manual_fused_ops': List of sequence of node names to handle as fused ops (even if they are not part of the fusing patterns).
     - `fusing_data`: A dictionary mapping fused operation IDs to lists of nodes that belong to that operation.
-    - `node_to_fused_node_map`: A dictionary mapping each node name to the ID of the fused operation it belongs to.
+    - `node_name_to_fused_op_id`: A dictionary mapping each node name to the ID of the fused operation it belongs to.
     """
     fusing_patterns: List[list[any]] = None
     manual_fused_ops: List[List[str]] = None
     fusing_data: Dict[str, Tuple['BaseNode']] = field(default_factory=dict)
-    node_to_fused_node_map: Dict[str, str] = field(init=False, default_factory=dict)
+    node_name_to_fused_op_id: Dict[str, str] = field(init=False, default_factory=dict)
     fused_op_id_to_quant_config: Dict[str, OpQuantizationConfig] = field(default_factory=dict)
     def __post_init__(self):
@@ -64,10 +64,10 @@ class FusingInfo:
         """
         Init the node-to-fused-node mapping based on the initial fusing data.
         """
-        self.node_to_fused_node_map.clear()
+        self.node_name_to_fused_op_id.clear()
         for op_id, nodes in self.fusing_data.items():
             for node in nodes:
-                self.node_to_fused_node_map[node.name] = op_id
+                self.node_name_to_fused_op_id[node.name] = op_id
     def get_manual_nodes_to_fuse(self) -> List[List[str]]:
         """
@@ -115,7 +115,7 @@ class FusingInfo:
         self.fusing_data[op_id] = nodes
         # Update the mapping for these nodes
         for node in nodes:
-            self.node_to_fused_node_map[node.name] = op_id
+            self.node_name_to_fused_op_id[node.name] = op_id
         # Update the quantization config mapping for this operation
         if self.fusing_patterns is not None:
@@ -152,7 +152,7 @@ class FusingInfo:
             self._manual_fused_ops.remove(node_names)
         for node in nodes:
-            self.node_to_fused_node_map.pop(node.name, None)
+            self.node_name_to_fused_op_id.pop(node.name, None)
         del self.fusing_data[op_id]
         self.fused_op_id_to_quant_config.pop(op_id, None)
@@ -166,7 +166,7 @@ class FusingInfo:
         Returns:
             The name of the fused node containing this node, or None if not fused.
         """
-        return self.node_to_fused_node_map.get(node_name)
+        return self.node_name_to_fused_op_id.get(node_name)
     def get_node_to_fused_node_map(self) -> Dict[str, str]:
         """
@@ -175,7 +175,7 @@ class FusingInfo:
         Returns:
             A dictionary mapping each original node name to its fused node name.
         """
-        return self.node_to_fused_node_map.copy()
+        return self.node_name_to_fused_op_id.copy()
     def get_fusing_quantization_config_map(self) -> Dict[str, OpQuantizationConfig]:
         """
@@ -198,10 +198,12 @@ class FusingInfo:
         """
         return self.fusing_data.get(op_id)
-    def get_nodes_to_disable_activation_quantization(self) -> List['BaseNode']:
+    def get_inner_fln_nodes(self) -> List['BaseNode']:
         """
-        Returns a list of the nodes that their activation quantization is disabled due to fusing.
+        Returns a list of the nodes that are part of an FLN but are not its last node.
         """
+        # TODO: the order of the nodes is not guaranteed when returned as dict from get_all_fused_operations -
+        #  then, removing the last one can cause issues
         return [node for nodes in self.get_all_fused_operations().values() for node in nodes[:-1]]
     def get_fused_op_quantization_config(self, op_id: str) -> OpQuantizationConfig:
@@ -228,6 +230,22 @@ class FusingInfo:
         """
         return any(node in nodes for nodes in self.fusing_data.values())
+    def is_quantized_node_in_fln(self, node: 'BaseNode') -> bool:
+        """
+        Check whether a node is inside an FLN and should be quantized.
+        Args:
+            node (BaseNode): The node to check.
+        Returns:
+            bool: True if the node is in any fused operation and should be quantized.
+        """
+        if self.is_node_in_fused_op(node):
+            node_q_cfg = self.fused_op_id_to_quant_config[self.node_name_to_fused_op_id[node.name]]
+            return node_q_cfg is not None and node_q_cfg.enable_activation_quantization
+        return False
     def get_all_fused_operations(self) -> Dict[str, Tuple['BaseNode']]:
         """
         Retrieve fused information.
@@ -340,7 +358,7 @@ class FusingInfo:
             for op_id, nodes in self.fusing_data.items()
         )
         mapping_repr = ", ".join(
-            f"{node} -> {op_id}" for node, op_id in self.node_to_fused_node_map.items()
+            f"{node} -> {op_id}" for node, op_id in self.node_name_to_fused_op_id.items()
         )
         return (
             f"FusingInfo(\n"

model_compression_toolkit/core/common/graph/base_graph.py CHANGED Viewed

@@ -908,7 +908,7 @@ class Graph(nx.MultiDiGraph, GraphSearches):
         Disable activation quantization for all nodes in fused operations,
         except for the last node in each fused group.
         """
-        nodes_to_disable = self.fusing_info.get_nodes_to_disable_activation_quantization()
+        nodes_to_disable = self.fusing_info.get_inner_fln_nodes()
         for node in nodes_to_disable:
             for qc in node.candidates_quantization_cfg:
                 qc.activation_quantization_cfg.quant_mode = ActivationQuantizationMode.FLN_QUANT

model_compression_toolkit/core/common/mixed_precision/resource_utilization_tools/resource_utilization_calculator.py CHANGED Viewed

@@ -677,7 +677,7 @@ class ResourceUtilizationCalculator:
         elif target_criterion == TargetInclusionCriterion.AnyQuantizedNonFused:
             nodes = [n for n in nodes if n.is_activation_quantization_enabled() or n.is_quantization_preserving()]
             # remove fused nodes (due to SNC, where the non-linear is quantized, even though it should not be quantized)
-            nodes = [n for n in nodes if n not in self.graph.fusing_info.get_nodes_to_disable_activation_quantization()]
+            nodes = [n for n in nodes if n not in self.graph.fusing_info.get_inner_fln_nodes()]
         elif target_criterion == TargetInclusionCriterion.QNonConfigurable:
             nodes = [n for n in nodes if n.is_activation_quantization_enabled() and not n.has_configurable_activation()]
         elif target_criterion != TargetInclusionCriterion.Any:    # pragma: no cover

model_compression_toolkit/core/common/model_collector.py CHANGED Viewed

@@ -30,7 +30,8 @@ from model_compression_toolkit.core.common.collectors.statistics_collector impor
 def create_stats_collector_for_node(node: common.BaseNode,
-                                    fw_info: FrameworkInfo) -> BaseStatsCollector:
+                                    fw_info: FrameworkInfo,
+                                    quant_node_in_fln: bool) -> BaseStatsCollector:
     """
     Gets a node and a groups list and create and return a statistics collector for a node
     according to whether its statistics should be collected and the prior information we
@@ -44,7 +45,7 @@ def create_stats_collector_for_node(node: common.BaseNode,
         Statistics collector for statistics collection for the node.
     """
-    if node.is_activation_quantization_enabled() or node.is_fln_quantization():
+    if node.is_activation_quantization_enabled() or quant_node_in_fln:
         min_output = getattr(node.prior_info, 'min_output', None)
         max_output = getattr(node.prior_info, 'max_output', None)
         stats_collector = common.StatsCollector(out_channel_axis=fw_info.out_channel_axis_mapping.get(node.type),
@@ -160,7 +161,8 @@ class ModelCollector:
         # Assign statistics collectors to nodes
         for n in graph.get_topo_sorted_nodes():
-            sc = create_stats_collector_for_node(n, fw_info=fw_info)  # Get static collector for the node
+            quant_node_in_fln = n.is_fln_quantization() and graph.fusing_info.is_quantized_node_in_fln(n)
+            sc = create_stats_collector_for_node(n, fw_info=fw_info, quant_node_in_fln=quant_node_in_fln)  # Get static collector for the node
             # If we use bias correction, and the node has kernel weights to quantize, we need to make sure
             # its previous nodes' tensors are consistent with this node.
             kernel_attr = fw_info.get_kernel_op_attributes(n.type)[0]

model_compression_toolkit/exporter/model_exporter/pytorch/fakely_quant_onnx_pytorch_exporter.py CHANGED Viewed

@@ -78,9 +78,18 @@ if FOUND_ONNX:
             act_holder_list = [n for n, m in self.model.named_modules()
                                if isinstance(m, PytorchActivationQuantizationHolder) and
                                m.activation_holder_quantizer.num_bits > 8]
-            for act_holder in act_holder_list:  # pragma: no cover
-                delattr(self.model, act_holder)
-                setattr(self.model, act_holder, torch.nn.Identity())
+            for act_holder in act_holder_list: # pragma: no cover
+                obj = self.model
+                attrs = act_holder.split(".")
+                for a in attrs[:-1]:
+                    obj = getattr(obj, a)
+                if hasattr(obj, attrs[-1]):
+                    delattr(obj, attrs[-1])
+                    setattr(obj, attrs[-1], torch.nn.Identity())
+                else:
+                    Logger.info(f"During removal of activation quantization of a quantizer (with bits > 8) in ONNX FQ "
+                                f"export, deletion of activation holder '{act_holder}' failed — could not locate one or"
+                                f"more intermediate attributes in the path.")
             for layer in self.model.children():
                 self.is_layer_exportable_fn(layer)

{mct_nightly-2.4.0.20250608.655.dist-info → mct_nightly-2.4.0.20250609.615.dist-info}/WHEEL RENAMED Viewed

File without changes

{mct_nightly-2.4.0.20250608.655.dist-info → mct_nightly-2.4.0.20250609.615.dist-info}/licenses/LICENSE.md RENAMED Viewed

File without changes

{mct_nightly-2.4.0.20250608.655.dist-info → mct_nightly-2.4.0.20250609.615.dist-info}/top_level.txt RENAMED Viewed

File without changes

mct-nightly 2.4.0.20250608.655__py3-none-any.whl → 2.4.0.20250609.615__py3-none-any.whl

mct-nightly 2.4.0.20250608.655__py3-none-any.whl → 2.4.0.20250609.615__py3-none-any.whl