PyPI - mct-nightly - Versions diffs - 2.3.0.20250127.521-py3-none-any.whl → 2.3.0.20250129.508-py3-none-any.whl - Mend

mct-nightly 2.3.0.20250127.521-py3-none-any.whl → 2.3.0.20250129.508-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (12) hide show

{mct_nightly-2.3.0.20250127.521.dist-info → mct_nightly-2.3.0.20250129.508.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.2
 Name: mct-nightly
-Version: 2.3.0.20250127.521
+Version: 2.3.0.20250129.508
 Summary: A Model Compression Toolkit for neural networks
 Classifier: Programming Language :: Python :: 3
 Classifier: License :: OSI Approved :: Apache Software License
@@ -13,7 +13,6 @@ Requires-Dist: networkx!=2.8.1
 Requires-Dist: tqdm
 Requires-Dist: Pillow
 Requires-Dist: numpy<2.0
-Requires-Dist: opencv-python
 Requires-Dist: scikit-image
 Requires-Dist: scikit-learn
 Requires-Dist: tensorboard

{mct_nightly-2.3.0.20250127.521.dist-info → mct_nightly-2.3.0.20250129.508.dist-info}/RECORD RENAMED Viewed

@@ -1,14 +1,14 @@
-model_compression_toolkit/__init__.py,sha256=i3_wgr-vg08-FyuHMqsTXicmFTY3B7fJpvoh30Z5zno,1557
+model_compression_toolkit/__init__.py,sha256=5yoBYX4rzT_uWukrdVc6UJm2mlcKu_6gh6agaWOa4-s,1557
 model_compression_toolkit/constants.py,sha256=i_R6uXBfO1ph_X6DNJych2x59SUojfJbn7dNjs_mZnc,3846
 model_compression_toolkit/defaultdict.py,sha256=LSc-sbZYXENMCw3U9F4GiXuv67IKpdn0Qm7Fr11jy-4,2277
-model_compression_toolkit/logger.py,sha256=3DByV41XHRR3kLTJNbpaMmikL8icd9e1N-nkQAY9oDk,4567
+model_compression_toolkit/logger.py,sha256=L3q7tn3Uht0i_7phnlOWMR2Te2zvzrt2HOz9vYEInts,4529
 model_compression_toolkit/metadata.py,sha256=x_Bk4VpzILdsFax6--CZ3X18qUTP28sbF_AhoQW8dNc,4003
 model_compression_toolkit/verify_packages.py,sha256=TlS-K1EP-QsghqWUW7SDPkAJiUf7ryw4tvhFDe6rCUk,1405
 model_compression_toolkit/core/__init__.py,sha256=8a0wUNBKwTdJGDk_Ho6WQAXjGuCqQZG1FUxxJlAV8L8,2096
 model_compression_toolkit/core/analyzer.py,sha256=X-2ZpkH1xdXnISnw1yJvXnvV-ssoUh-9LkLISSWNqiY,3691
 model_compression_toolkit/core/graph_prep_runner.py,sha256=CVTjBaci8F6EP3IKDnRMfxkP-Sv8qY8GpkGt6FyII2U,11376
 model_compression_toolkit/core/quantization_prep_runner.py,sha256=OtL6g2rTC5mfdKrkzm47EPPW-voGGVYMYxpy2_sfu1U,6547
-model_compression_toolkit/core/runner.py,sha256=T3AMorIqKSIQQAdN9XKrqmFBmdXr6H5tVBn5RDgg8as,13876
+model_compression_toolkit/core/runner.py,sha256=iJpDasfs7wtdAelIRaBPxDbN64phPern1O86QDM2HeY,13706
 model_compression_toolkit/core/common/__init__.py,sha256=Wh127PbXcETZX_d1PQqZ71ETK3J9XO5A-HpadGUbj6o,1447
 model_compression_toolkit/core/common/base_substitutions.py,sha256=xDFSmVVs_iFSZfajytI0cuQaNRNcwHX3uqOoHgVUvxQ,1666
 model_compression_toolkit/core/common/framework_implementation.py,sha256=IkMydCj6voau7dwkYLYA_Ka_EFUKP3GKQdpYN6b1fgc,22163
@@ -33,7 +33,7 @@ model_compression_toolkit/core/common/fusion/graph_fuser.py,sha256=b41_4rL_Adiza
 model_compression_toolkit/core/common/fusion/layer_fusing.py,sha256=-2fnjyC9q2RPw9st6RxROW-gdtT2mSRz0QZ_Gz1KDz4,5579
 model_compression_toolkit/core/common/graph/__init__.py,sha256=Xr-Lt_qXMdrCnnOaUS_OJP_3iTTGfPCLf8_vSrQgCs0,773
 model_compression_toolkit/core/common/graph/base_graph.py,sha256=WDyN45Y_wdBR3d5nb-3AX2tsrPxeUtc6GE98xZA-0mY,37818
-model_compression_toolkit/core/common/graph/base_node.py,sha256=dAYaPScFjeBIhwLxJAZQKUFpKwVcdcbmLh9uvw1eU6Q,33042
+model_compression_toolkit/core/common/graph/base_node.py,sha256=_SJBlDIwq5Kt2HLYWIT6POJFnUfrtcOFlOLxTbadJ1w,33058
 model_compression_toolkit/core/common/graph/edge.py,sha256=buoSEUZwilWBK3WeBKpJ-GeDaUA1SDdOHxDpxU_bGpk,3784
 model_compression_toolkit/core/common/graph/functional_node.py,sha256=GH5wStmw8SoAj5IdT_-ItN1Meo_P5NUTt_5bgJC4fak,3935
 model_compression_toolkit/core/common/graph/graph_matchers.py,sha256=CrDoHYq4iPaflgJWmoJ1K4ziLrRogJvFTVWg8P0UcDU,4744
@@ -73,7 +73,7 @@ model_compression_toolkit/core/common/mixed_precision/set_layer_to_bitwidth.py,s
 model_compression_toolkit/core/common/mixed_precision/solution_refinement_procedure.py,sha256=8oAFJc_KC3z5ClI-zo4KC40kKGscyixUc5oYP4j4cMo,8019
 model_compression_toolkit/core/common/mixed_precision/resource_utilization_tools/__init__.py,sha256=Rf1RcYmelmdZmBV5qOKvKWF575ofc06JFQSq83Jz99A,696
 model_compression_toolkit/core/common/mixed_precision/resource_utilization_tools/resource_utilization.py,sha256=T5yVr7lay-6QLuTDBZNI1Ufj02EMBWuY_yHjC8eHx5I,3998
-model_compression_toolkit/core/common/mixed_precision/resource_utilization_tools/resource_utilization_calculator.py,sha256=qdnkkviZZFYqFuRY7o0US_ihH1Iq-X-eG7OwiTVsRBU,34937
+model_compression_toolkit/core/common/mixed_precision/resource_utilization_tools/resource_utilization_calculator.py,sha256=DyiE84ECgwtaCATWcisv-7ndmBUbj_TaddZ7GeIjlrU,35307
 model_compression_toolkit/core/common/mixed_precision/resource_utilization_tools/resource_utilization_data.py,sha256=J7gqUGs4ITo4ufl84A5vACxm670LG6RhQyXkejfpbn8,8834
 model_compression_toolkit/core/common/mixed_precision/search_methods/__init__.py,sha256=sw7LOPN1bM82o3SkMaklyH0jw-TLGK0-fl2Wq73rffI,697
 model_compression_toolkit/core/common/mixed_precision/search_methods/linear_programming.py,sha256=uhC0az5OVSfeYexcasoy0cT8ZOonFKIedk_1U-ZPLhA,17171
@@ -104,7 +104,7 @@ model_compression_toolkit/core/common/quantization/candidate_node_quantization_c
 model_compression_toolkit/core/common/quantization/core_config.py,sha256=yxCzWqldcHoe8GGxrH0tp99bhrc5jDT7SgZftnMUUBE,2374
 model_compression_toolkit/core/common/quantization/debug_config.py,sha256=zJP2W9apUPX9RstpPWWK71wr9xJsg7j-s7lGV4_bQdc,1510
 model_compression_toolkit/core/common/quantization/filter_nodes_candidates.py,sha256=IHVX-Gdekru4xLuDTgcsp_JCnRtuVWnbYsDBQuSXTKc,7079
-model_compression_toolkit/core/common/quantization/node_quantization_config.py,sha256=HctuRvQsT6Dx9A3lLiLEijghPftM-iABcjmDShlPAn4,26527
+model_compression_toolkit/core/common/quantization/node_quantization_config.py,sha256=teDclY8WmuVqqa9Fgr6WY-7ILDep0QKzKxoZCKzBG2k,26960
 model_compression_toolkit/core/common/quantization/quantization_config.py,sha256=UkSVW7d1OF_Px9gAjsqqK65aYhIBFWaBO-_IH6_AFfg,4403
 model_compression_toolkit/core/common/quantization/quantization_fn_selection.py,sha256=HfBkSiRTOf9mNF-TNQHTCCs3xSg66F20no0O6vl5v1Y,2154
 model_compression_toolkit/core/common/quantization/quantization_params_fn_selection.py,sha256=7eG7dl1TcbdnHwgmvyjarxLs0o6Lw_9VAjXAm4rsiBk,3791
@@ -312,7 +312,7 @@ model_compression_toolkit/data_generation/pytorch/pytorch_data_generation.py,sha
 model_compression_toolkit/data_generation/pytorch/optimization_functions/__init__.py,sha256=huHoBUcKNB6BnY6YaUCcFvdyBtBI172ZoUD8ZYeNc6o,696
 model_compression_toolkit/data_generation/pytorch/optimization_functions/batchnorm_alignment_functions.py,sha256=dMc4zz9XfYfAT4Cxns57VgvGZWPAMfaGlWLFyCyl8TA,1968
 model_compression_toolkit/data_generation/pytorch/optimization_functions/bn_layer_weighting_functions.py,sha256=We0fVMQ4oU7Y0IWQ8fKy8KpqkIiLyKoQeF9XKAQ6TH0,3317
-model_compression_toolkit/data_generation/pytorch/optimization_functions/image_initilization.py,sha256=hhWSZ7w45dE5SQ6jM27cBkCSJObWkALs_RpD6afPi68,4753
+model_compression_toolkit/data_generation/pytorch/optimization_functions/image_initilization.py,sha256=0mV2BuegNvL9MnDBu2NiJo--4KCcdDDzbWUMU4uld5w,4678
 model_compression_toolkit/data_generation/pytorch/optimization_functions/lr_scheduler.py,sha256=NydGxFIclmrfU3HWYUrRbprg4hPt470QP6MTOMLEhRs,9172
 model_compression_toolkit/data_generation/pytorch/optimization_functions/output_loss_functions.py,sha256=PRVmn8o2hTdwTdbd2ezf__LNbFvcgiVO0c25dsyg3Tg,6549
 model_compression_toolkit/data_generation/pytorch/optimization_functions/scheduler_step_functions.py,sha256=zMjY2y4FSHonuY5hddbMTb8qAQtLtohYF7q1wuruDDs,3267
@@ -523,8 +523,8 @@ model_compression_toolkit/xquant/pytorch/model_analyzer.py,sha256=b93o800yVB3Z-i
 model_compression_toolkit/xquant/pytorch/pytorch_report_utils.py,sha256=UVN_S9ULHBEldBpShCOt8-soT8YTQ5oE362y96qF_FA,3950
 model_compression_toolkit/xquant/pytorch/similarity_functions.py,sha256=CERxq5K8rqaiE-DlwhZBTUd9x69dtYJlkHOPLB54vm8,2354
 model_compression_toolkit/xquant/pytorch/tensorboard_utils.py,sha256=mkoEktLFFHtEKzzFRn_jCnxjhJolK12TZ5AQeDHzUO8,9767
-mct_nightly-2.3.0.20250127.521.dist-info/LICENSE.md,sha256=aYSSIb-5AFPeITTvXm1UAoe0uYBiMmSS8flvXaaFUks,10174
-mct_nightly-2.3.0.20250127.521.dist-info/METADATA,sha256=ZhEsvuco-uGyjmQ-dWuDtpCgGFllAcujWNiGhzowOjI,26601
-mct_nightly-2.3.0.20250127.521.dist-info/WHEEL,sha256=In9FTNxeP60KnTkGw7wk6mJPYd_dQSjEZmXdBdMCI-8,91
-mct_nightly-2.3.0.20250127.521.dist-info/top_level.txt,sha256=gsYA8juk0Z-ZmQRKULkb3JLGdOdz8jW_cMRjisn9ga4,26
-mct_nightly-2.3.0.20250127.521.dist-info/RECORD,,
+mct_nightly-2.3.0.20250129.508.dist-info/LICENSE.md,sha256=aYSSIb-5AFPeITTvXm1UAoe0uYBiMmSS8flvXaaFUks,10174
+mct_nightly-2.3.0.20250129.508.dist-info/METADATA,sha256=V1ZMks36vbn2kcBLkb88KKI-viLM_xXXWWIPogCNTnI,26572
+mct_nightly-2.3.0.20250129.508.dist-info/WHEEL,sha256=In9FTNxeP60KnTkGw7wk6mJPYd_dQSjEZmXdBdMCI-8,91
+mct_nightly-2.3.0.20250129.508.dist-info/top_level.txt,sha256=gsYA8juk0Z-ZmQRKULkb3JLGdOdz8jW_cMRjisn9ga4,26
+mct_nightly-2.3.0.20250129.508.dist-info/RECORD,,

model_compression_toolkit/__init__.py CHANGED Viewed

@@ -27,4 +27,4 @@ from model_compression_toolkit import data_generation
 from model_compression_toolkit import pruning
 from model_compression_toolkit.trainable_infrastructure.keras.load_model import keras_load_quantized_model
-__version__ = "2.3.0.20250127.000521"
+__version__ = "2.3.0.20250129.000508"

model_compression_toolkit/core/common/graph/base_node.py CHANGED Viewed

@@ -30,6 +30,9 @@ from model_compression_toolkit.target_platform_capabilities.targetplatform2frame
     FrameworkQuantizationCapabilities
+WeightAttrT = Union[str, int]
 class BaseNode:
     """
     Class to represent a node in a graph that represents the model.
@@ -40,7 +43,7 @@ class BaseNode:
                  framework_attr: Dict[str, Any],
                  input_shape: Tuple[Any],
                  output_shape: Tuple[Any],
-                 weights: Dict[Union[str, int], np.ndarray],
+                 weights: Dict[WeightAttrT, np.ndarray],
                  layer_class: type,
                  reuse: bool = False,
                  reuse_group: str = None,
@@ -189,7 +192,7 @@ class BaseNode:
         """
         return self.reuse or self.reuse_group is not None
-    def _get_weight_name(self, name: Union[str, int]) -> List[Union[str, int]]:
+    def _get_weight_name(self, name: WeightAttrT) -> List[WeightAttrT]:
         """
         Get weight names that match argument name (either string weights or integer for
         positional weights).
@@ -203,7 +206,7 @@ class BaseNode:
         return [k for k in self.weights.keys()
                 if (isinstance(k, int) and name == k) or (isinstance(k, str) and name in k)]
-    def get_weights_by_keys(self, name: Union[str, int]) -> np.ndarray:
+    def get_weights_by_keys(self, name: WeightAttrT) -> np.ndarray:
         """
         Get a node's weight by its name.
         Args:

model_compression_toolkit/core/common/mixed_precision/resource_utilization_tools/resource_utilization_calculator.py CHANGED Viewed

@@ -15,13 +15,14 @@
 from collections import defaultdict
 from copy import deepcopy
 from enum import Enum, auto
-from typing import Dict, NamedTuple, Optional, Tuple, List, Iterable, Union, Literal, Sequence, Set
+from typing import Dict, NamedTuple, Optional, Tuple, List, Iterable, Union, Literal, Sequence
 from model_compression_toolkit.logger import Logger
 from model_compression_toolkit.constants import FLOAT_BITWIDTH
 from model_compression_toolkit.core import FrameworkInfo
 from model_compression_toolkit.core.common import Graph, BaseNode
 from model_compression_toolkit.core.common.framework_implementation import FrameworkImplementation
+from model_compression_toolkit.core.common.graph.base_node import WeightAttrT
 from model_compression_toolkit.core.common.graph.edge import EDGE_SINK_INDEX
 from model_compression_toolkit.core.common.graph.memory_graph.compute_graph_max_cut import compute_graph_max_cut
 from model_compression_toolkit.core.common.graph.memory_graph.cut import Cut
@@ -79,24 +80,25 @@ class Utilization(NamedTuple):
       bytes: memory utilization.
     """
     size: int
-    bytes: Optional[float]
+    bytes: float
     def __add__(self, other: 'Utilization') -> 'Utilization':
+        """ Add another Utilization object. """
         return Utilization(self.size + other.size, self.bytes + other.bytes)
-    def __radd__(self, other: Union['Utilization', Literal[0]]):
-        # Needed for sum (with default start_value=0).
-        if other == 0:
-            return self
-        return self + other    # pragma: no cover
+    def __radd__(self, other: Literal[0]):
+        """ Right add is only supported with 0 to allow the sum operator (with the default start_value=0) """
+        if other != 0:
+            raise ValueError('radd is only supported with 0')
+        return self
     def __gt__(self, other: 'Utilization'):
-        # Needed for max. Compare by bytes.
+        """ Greater than operator by bytes. Needed for max. """
         return self.bytes > other.bytes
     def __lt__(self, other: 'Utilization'):
-        # Needed for min. Compare by bytes.
-        return self.bytes < other.bytes    # pragma: no cover
+        """ Less than operator by bytes. Needed for min. """
+        return self.bytes < other.bytes
 class ResourceUtilizationCalculator:
@@ -107,6 +109,8 @@ class ResourceUtilizationCalculator:
         BitwidthMode.QMinBit: min,
     }
+    unexpected_qc_error = 'Custom quantization configuration is not expected for non-custom bit mode.'
     def __init__(self, graph: Graph, fw_impl: FrameworkImplementation, fw_info: FrameworkInfo):
         self.graph = graph
         self.fw_impl = fw_impl
@@ -118,17 +122,17 @@ class ResourceUtilizationCalculator:
         self._params_cnt = {}
         for n in graph.nodes:
             self._act_tensors_size[n] = n.get_total_output_params()
-            self._params_cnt[n] = {k: v.size for k, v in n.weights.items()}
+            if n.weights:
+                self._params_cnt[n] = {k: v.size for k, v in n.weights.items()}
         self._cuts: Optional[Dict[Cut, List[BaseNode]]] = None
     @property
     def cuts(self) -> Dict[Cut, List[BaseNode]]:
         """ Compute if needed and return graph cuts and their memory element nodes. """
         if self._cuts is None:
-            memory_graph = MemoryGraph(deepcopy(self.graph))
-            _, _, cuts = compute_graph_max_cut(memory_graph)
+            cuts = self._compute_cuts()
             if cuts is None:    # pragma: no cover
-                raise RuntimeError("Failed to calculate activation memory cuts for graph.")  # pragma: no cover
+                raise RuntimeError("Failed to calculate activation memory cuts for graph.")
             cuts = [cut for cut in cuts if cut.mem_elements.elements]
             # cache cuts nodes for future use, so do not filter by target
             self._cuts = {cut: [self.graph.find_node_by_name(m.node_name)[0] for m in cut.mem_elements.elements]
@@ -140,7 +144,8 @@ class ResourceUtilizationCalculator:
                                      bitwidth_mode: BitwidthMode,
                                      act_qcs: Optional[Dict[BaseNode, NodeActivationQuantizationConfig]] = None,
                                      w_qcs: Optional[Dict[BaseNode, NodeWeightsQuantizationConfig]] = None,
-                                     ru_targets: Iterable[RUTarget] = None) -> ResourceUtilization:
+                                     ru_targets: Iterable[RUTarget] = None,
+                                     allow_unused_qcs: bool = False) -> ResourceUtilization:
         """
         Compute network's resource utilization.
@@ -154,16 +159,26 @@ class ResourceUtilizationCalculator:
               In custom mode, must provide configuration for all configurable weights. For non-configurable
               weights, if not provided, the default configuration will be extracted from the node.
             ru_targets: metrics to include for computation. If None, all metrics are calculated.
+            allow_unused_qcs: by default, if custom quantization configs are passed, but are not going to be used for
+              any of the requested targets, an error is raised. To disable the validation, pass True.
         Returns:
             Resource utilization object.
         """
         ru_targets = set(ru_targets) if ru_targets else set(RUTarget)
-        if w_qcs is not None and not self.is_custom_weights_config_applicable(ru_targets):
-            raise ValueError('Weight configuration passed but no relevant metric requested.')
-        if act_qcs is not None and not self.is_custom_activation_config_applicable(ru_targets):
-            raise ValueError('Activation configuration passed but no relevant metric requested.')
+        if (w_qcs or act_qcs) and bitwidth_mode != BitwidthMode.QCustom:
+            raise ValueError(self.unexpected_qc_error)
+        if w_qcs and not {RUTarget.WEIGHTS, RUTarget.TOTAL, RUTarget.BOPS}.intersection(ru_targets):
+            if not allow_unused_qcs:
+                raise ValueError('Weight configuration passed but no relevant ru_targets requested.')
+            w_qcs = None
+        if act_qcs and not {RUTarget.ACTIVATION, RUTarget.TOTAL, RUTarget.BOPS}.intersection(ru_targets):
+            if not allow_unused_qcs:
+                raise ValueError('Activation configuration passed but no relevant ru_targets requested.')
+            act_qcs = None
         w_total, a_total = None, None
         if {RUTarget.WEIGHTS, RUTarget.TOTAL}.intersection(ru_targets):
@@ -180,8 +195,7 @@ class ResourceUtilizationCalculator:
         if RUTarget.TOTAL in ru_targets:
             ru.total_memory = w_total + a_total
         if RUTarget.BOPS in ru_targets:
-            ru.bops, _ = self.compute_bops(target_criterion=target_criterion,
-                                           bitwidth_mode=bitwidth_mode, act_qcs=act_qcs, w_qcs=w_qcs)
+            ru.bops, _ = self.compute_bops(target_criterion, bitwidth_mode, act_qcs=act_qcs, w_qcs=w_qcs)
         assert ru.get_restricted_targets() == set(ru_targets), 'Mismatch between the number of requested and computed metrics'
         return ru
@@ -206,35 +220,35 @@ class ResourceUtilizationCalculator:
             - Per node total weights utilization. Dict keys are nodes in a topological order.
             - Detailed per node per weight attribute utilization. Dict keys are nodes in a topological order.
         """
-        nodes = self._get_target_weight_nodes(target_criterion, include_reused=False)
-        if not nodes:
-            return 0, {}, {}
+        if w_qcs and bitwidth_mode != BitwidthMode.QCustom:
+            raise ValueError(self.unexpected_qc_error)
+        node_attrs = self._collect_target_nodes_w_attrs(target_criterion, include_reused=False)
         util_per_node: Dict[BaseNode, Utilization] = {}
         util_per_node_per_weight = {}
-        for n in self._topo_sort(nodes):
+        for n in self._topo_sort(list(node_attrs.keys())):
             w_qc = w_qcs.get(n) if w_qcs else None
-            node_weights_util, per_weight_util = self.compute_node_weights_utilization(n, target_criterion,
+            node_weights_util, per_weight_util = self.compute_node_weights_utilization(n, node_attrs[n],
                                                                                        bitwidth_mode, w_qc)
             util_per_node[n] = node_weights_util
             util_per_node_per_weight[n] = per_weight_util
-        total_util = sum(util_per_node.values())
+        total_util = sum(util_per_node.values()) if util_per_node else Utilization(0, 0)
         return total_util.bytes, util_per_node, util_per_node_per_weight
     def compute_node_weights_utilization(self,
                                          n: BaseNode,
-                                         target_criterion: TargetInclusionCriterion,
+                                         target_criterion: Union[TargetInclusionCriterion, List[str]],
                                          bitwidth_mode: BitwidthMode,
-                                         qc: NodeWeightsQuantizationConfig)\
+                                         qc: Optional[NodeWeightsQuantizationConfig] = None)\
             -> Tuple[Utilization, Dict[str, Utilization]]:
         """
         Compute resource utilization for weights of a node.
         Args:
             n: node.
-            target_criterion: criterion to include weights for computation.
+            target_criterion: criterion to include weights for computation, or explicit attributes list (full names).
             bitwidth_mode: bit-width mode for the computation.
             qc: custom weights quantization configuration. Should be provided for custom bit mode only.
               In custom mode, must provide configuration for all configurable weights. For non-configurable
@@ -244,9 +258,21 @@ class ResourceUtilizationCalculator:
             - Node's total weights utilization.
             - Detailed per weight attribute utilization.
         """
-        weight_attrs = self._get_target_weight_attrs(n, target_criterion)
-        if not weight_attrs:    # pragma: no cover
-            return Utilization(0, 0), {}
+        if qc:
+            if bitwidth_mode != BitwidthMode.QCustom:
+                raise ValueError(self.unexpected_qc_error)
+            if set(qc.all_weight_attrs) - set(n.get_node_weights_attributes()):
+                raise ValueError(f'Custom configuration contains unexpected weight attrs {qc.all_weight_attrs} for '
+                                 f'node {n} containing weight attrs {n.get_node_weights_attributes()}.')
+        # If target criterion is passed, weights_attrs may return empty, that's fine.
+        # However, if an explicit list is passed, it must be non-empty.
+        if isinstance(target_criterion, TargetInclusionCriterion):
+            weight_attrs = self._get_target_weight_attrs(n, target_criterion)
+        else:
+            weight_attrs = target_criterion
+            if not weight_attrs:
+                raise ValueError('Explicit list of attributes to compute cannot be empty.')
         attr_util = {}
         for attr in weight_attrs:
@@ -255,7 +281,7 @@ class ResourceUtilizationCalculator:
             bytes_ = size * nbits / 8
             attr_util[attr] = Utilization(size, bytes_)
-        total_weights: Utilization = sum(attr_util.values())    # type: ignore
+        total_weights: Utilization = sum(attr_util.values()) if attr_util else Utilization(0, 0)
         return total_weights, attr_util
     def compute_activations_utilization(self,
@@ -280,7 +306,7 @@ class ResourceUtilizationCalculator:
     def compute_activation_utilization_by_cut(self,
                                               target_criterion: TargetInclusionCriterion,
                                               bitwidth_mode: BitwidthMode,
-                                              act_qcs: Optional[Dict[BaseNode, NodeActivationQuantizationConfig]]) \
+                                              act_qcs: Optional[Dict[BaseNode, NodeActivationQuantizationConfig]] = None) \
             -> Tuple[float, Dict[Cut, Utilization], Dict[Cut, Dict[BaseNode, Utilization]]]:
         """
         Compute graph activation cuts utilization.
@@ -297,15 +323,15 @@ class ResourceUtilizationCalculator:
             - Total activation utilization per cut.
             - Detailed activation utilization per cut per node.
         """
-        if target_criterion != TargetInclusionCriterion.AnyQuantized:    # pragma: no cover
-            raise NotImplementedError('Computing MaxCut activation utilization is currently only supported for quantized targets.')
+        if act_qcs and not bitwidth_mode == BitwidthMode.QCustom:
+            raise ValueError(self.unexpected_qc_error)
         graph_target_nodes = self._get_target_activation_nodes(target_criterion, include_reused=True)
         # if there are no target activations in the graph, don't waste time looking for cuts
         if not graph_target_nodes:
             return 0, {}, {}
-        util_per_cut: Dict[Cut, Utilization] = {}    # type: ignore
+        util_per_cut: Dict[Cut, Utilization] = {}
         util_per_cut_per_node = defaultdict(dict)
         for cut in self.cuts:
             cut_target_nodes = self._get_cut_target_nodes(cut, target_criterion)
@@ -325,7 +351,7 @@ class ResourceUtilizationCalculator:
                                                bitwidth_mode: BitwidthMode,
                                                act_qcs: Optional[Dict[BaseNode, NodeActivationQuantizationConfig]] = None,
                                                include_reused=False) \
-            -> Tuple[float, Dict[BaseNode, Utilization]]:    # pragma: no cover
+            -> Tuple[float, Dict[BaseNode, Utilization]]:
         """
         Compute resource utilization for graph's activations tensors.
@@ -341,9 +367,10 @@ class ResourceUtilizationCalculator:
             - Detailed utilization per node. Dict keys are nodes in a topological order.
         """
+        if act_qcs and bitwidth_mode != BitwidthMode.QCustom:
+            raise ValueError(self.unexpected_qc_error)
         nodes = self._get_target_activation_nodes(target_criterion, include_reused=include_reused)
-        if not nodes:
-            return 0, {}
         util_per_node: Dict[BaseNode, Utilization] = {}
         for n in self._topo_sort(nodes):
@@ -351,14 +378,14 @@ class ResourceUtilizationCalculator:
             util = self.compute_node_activation_tensor_utilization(n, None, bitwidth_mode, qc)
             util_per_node[n] = util
-        total_util = max(util_per_node.values())
-        return total_util.bytes, util_per_node
+        total_util = max(util_per_node.values()).bytes if util_per_node else 0
+        return total_util, util_per_node
     def compute_node_activation_tensor_utilization(self,
                                                    n: BaseNode,
                                                    target_criterion: Optional[TargetInclusionCriterion],
                                                    bitwidth_mode: BitwidthMode,
-                                                   qc: Optional[NodeActivationQuantizationConfig]) -> Utilization:
+                                                   qc: Optional[NodeActivationQuantizationConfig] = None) -> Utilization:
         """
         Compute activation resource utilization for a node.
@@ -372,9 +399,13 @@ class ResourceUtilizationCalculator:
         Returns:
             Node's activation utilization.
         """
+        if qc and bitwidth_mode != BitwidthMode.QCustom:
+            raise ValueError(self.unexpected_qc_error)
         if target_criterion:
+            # only check whether the node meets the criterion
             nodes = self._get_target_activation_nodes(target_criterion=target_criterion, include_reused=True, nodes=[n])
-            if not nodes:    # pragma: no cover
+            if not nodes:
                 return Utilization(0, 0)
         size = self._act_tensors_size[n]
@@ -410,7 +441,7 @@ class ResourceUtilizationCalculator:
         if target_criterion != TargetInclusionCriterion.AnyQuantized:    # pragma: no cover
             raise NotImplementedError('BOPS computation is currently only supported for quantized targets.')
-        nodes = self._get_target_weight_nodes(target_criterion, include_reused=True)
+        nodes = self._collect_target_nodes_w_attrs(target_criterion, include_reused=True)
         # filter out nodes with only positional weights # TODO add as arg to get target nodes
         nodes = [n for n in nodes if n.has_kernel_weight_to_quantize(self.fw_info)]
@@ -448,7 +479,7 @@ class ResourceUtilizationCalculator:
         incoming_edges = self.graph.incoming_edges(n, sort_by_attr=EDGE_SINK_INDEX)
         # TODO temporary adding this for const_representation test in torch which has Linear with const input
-        if not incoming_edges:
+        if not incoming_edges:    # pragma: no cover
             return 0
         assert len(incoming_edges) == 1, \
             f'Unexpected number of inputs {len(incoming_edges)} for BOPS calculation. Expected 1.'
@@ -465,13 +496,11 @@ class ResourceUtilizationCalculator:
         node_bops = a_nbits * w_nbits * node_mac
         return node_bops
-    def is_custom_weights_config_applicable(self, ru_targets: Set[RUTarget]) -> bool:
-        """ Whether custom configuration for weights is compatible with the requested targets."""
-        return bool({RUTarget.WEIGHTS, RUTarget.TOTAL, RUTarget.BOPS}.intersection(ru_targets))
-    def is_custom_activation_config_applicable(self, ru_targets: Set[RUTarget]) -> bool:
-        """ Whether custom configuration for activations is compatible with the requested targets."""
-        return bool({RUTarget.ACTIVATION, RUTarget.TOTAL, RUTarget.BOPS}.intersection(ru_targets))
+    def _compute_cuts(self):
+        """ Compute activation cuts of the graph. """
+        memory_graph = MemoryGraph(deepcopy(self.graph))
+        _, _, cuts = compute_graph_max_cut(memory_graph)
+        return cuts
     def _get_cut_target_nodes(self, cut: Cut, target_criterion: TargetInclusionCriterion) -> List[BaseNode]:
         """
@@ -487,37 +516,23 @@ class ResourceUtilizationCalculator:
         cut_nodes = self.cuts[cut]
         return self._get_target_activation_nodes(target_criterion, include_reused=True, nodes=cut_nodes)
-    def _get_target_weight_nodes(self,
-                                 target_criterion: TargetInclusionCriterion,
-                                 include_reused: bool) -> List[BaseNode]:
+    def _collect_target_nodes_w_attrs(self,
+                                      target_criterion: TargetInclusionCriterion,
+                                      include_reused: bool) -> Dict[BaseNode, List[WeightAttrT]]:
         """
-        Collect nodes to include in weights utilization computation.
+        Collect nodes and their weight attributes to include in weights utilization computation.
         Args:
             target_criterion: criterion to include weights for computation.
             include_reused: whether to include reused nodes.
         Returns:
-            Target nodes.
+            A mapping from nodes to their weights attributes.
         """
-        if target_criterion == TargetInclusionCriterion.QConfigurable:
-            nodes = self.graph.get_weights_configurable_nodes(self.fw_info, include_reused_nodes=include_reused)
-        elif target_criterion == TargetInclusionCriterion.AnyQuantized:
-            nodes = [n for n in self.graph if n.has_any_weight_attr_to_quantize()]
-        elif target_criterion == TargetInclusionCriterion.QNonConfigurable:
-            # TODO this is wrong. Need to look at specific weights and not the whole node (if w1 is configurable and w2
-            #  is non-configurable we want to discover the node both as configurable and non-configurable)
-            quantized = [n for n in self.graph if n.has_any_weight_attr_to_quantize()]
-            configurable = self.graph.get_weights_configurable_nodes(self.fw_info, include_reused_nodes=include_reused)
-            nodes = [n for n in quantized if n not in configurable]
-        elif target_criterion == TargetInclusionCriterion.Any:    # pragma: no cover
-            nodes = list(self.graph.nodes)
-        else:    # pragma: no cover
-            raise ValueError(f'Unknown {target_criterion}.')
-        if not include_reused:
-            nodes = [n for n in nodes if not n.reuse]
-        return nodes
+        nodes_attrs = {n: attrs for n in self.graph.nodes
+                       if (attrs := self._get_target_weight_attrs(n, target_criterion))
+                           and (include_reused or not n.reuse)}
+        return nodes_attrs
     def _get_target_weight_attrs(self, n: BaseNode, target_criterion: TargetInclusionCriterion) -> List[str]:
         """
@@ -530,6 +545,7 @@ class ResourceUtilizationCalculator:
         Returns:
             Selected weight attributes names.
         """
+        # weight_attrs are the full names in the layer, e.g. 'conv2d_1/kernel:0' (or an integer for positional attrs)
         weight_attrs = n.get_node_weights_attributes()
         if target_criterion == TargetInclusionCriterion.QConfigurable:
             weight_attrs = [attr for attr in weight_attrs if n.is_configurable_weight(attr)]
@@ -548,14 +564,17 @@ class ResourceUtilizationCalculator:
         Sort nodes in a topological order (based on graph's nodes).
         Args:
-            nodes: nodes to sort.
+            nodes: nodes to sort. Allowed to be empty.
         Returns:
             Nodes in topological order.
         """
+        if not nodes:
+            return list(nodes)
         graph_topo_nodes = self.graph.get_topo_sorted_nodes()
         topo_nodes = [n for n in graph_topo_nodes if n in nodes]
-        if len(topo_nodes) != len(nodes):    # pragma: no cover
+        if len(topo_nodes) != len(nodes):
             missing_nodes = [n for n in nodes if n not in topo_nodes]
             raise ValueError(f'Could not topo-sort, nodes {missing_nodes} do not match the graph nodes.')
         return topo_nodes
@@ -576,15 +595,15 @@ class ResourceUtilizationCalculator:
             Selected nodes.
         """
         nodes = nodes or self.graph.nodes
-        if target_criterion == TargetInclusionCriterion.QConfigurable:    # pragma: no cover
+        if target_criterion == TargetInclusionCriterion.QConfigurable:
             nodes = [n for n in nodes if n.has_configurable_activation()]
         elif target_criterion == TargetInclusionCriterion.AnyQuantized:
             nodes = [n for n in nodes if n.is_activation_quantization_enabled()]
-        elif target_criterion == TargetInclusionCriterion.QNonConfigurable:    # pragma: no cover
+        elif target_criterion == TargetInclusionCriterion.QNonConfigurable:
             nodes = [n for n in nodes if n.is_activation_quantization_enabled() and not n.has_configurable_activation()]
         elif target_criterion != TargetInclusionCriterion.Any:    # pragma: no cover
             raise ValueError(f'Unknown {target_criterion}.')
-        if not include_reused:    # pragma: no cover
+        if not include_reused:
             nodes = [n for n in nodes if not n.reuse]
         return nodes
@@ -607,8 +626,7 @@ class ResourceUtilizationCalculator:
             Activation bit-width.
         """
         if act_qc:
-            if bitwidth_mode != BitwidthMode.QCustom:    # pragma: no cover
-                raise ValueError(f'Activation config is not expected for non-custom bit mode {bitwidth_mode}')
+            assert bitwidth_mode == BitwidthMode.QCustom
             return act_qc.activation_n_bits if act_qc.enable_activation_quantization else FLOAT_BITWIDTH
         if bitwidth_mode == BitwidthMode.Float or not n.is_activation_quantization_enabled():
@@ -623,8 +641,8 @@ class ResourceUtilizationCalculator:
         if bitwidth_mode in [BitwidthMode.QCustom, BitwidthMode.QDefaultSP]:
             qcs = n.get_unique_activation_candidates()
-            if len(qcs) != 1:    # pragma: no cover
-                raise ValueError(f'Could not retrieve the activation quantization candidate for node {n.name} '
+            if len(qcs) != 1:
+                raise ValueError(f'Could not retrieve the activation quantization candidate for node {n} '
                                  f'as it has {len(qcs)}!=1 unique candidates .')
             return qcs[0].activation_quantization_cfg.activation_n_bits
@@ -650,9 +668,8 @@ class ResourceUtilizationCalculator:
         Returns:
             Weight bit-width.
         """
+        assert not (w_qc and bitwidth_mode != BitwidthMode.QCustom)
         if w_qc and w_qc.has_attribute_config(w_attr):
-            if bitwidth_mode != BitwidthMode.QCustom:    # pragma: no cover
-                raise ValueError('Weight config is not expected for non-custom bit mode {bitwidth_mode}')
             attr_cfg = w_qc.get_attr_config(w_attr)
             return attr_cfg.weights_n_bits if attr_cfg.enable_weights_quantization else FLOAT_BITWIDTH
@@ -669,9 +686,9 @@ class ResourceUtilizationCalculator:
         if bitwidth_mode in [BitwidthMode.QCustom, BitwidthMode.QDefaultSP]:
             # if configuration was not passed and the weight has only one candidate, use it
-            if len(w_qcs) != 1:    # pragma: no cover
-                raise ValueError(f'Could not retrieve the quantization candidate for attr {w_attr} of node {n.name} '
-                                 f'as it {len(w_qcs)}!=1 unique candidates.')
+            if len(w_qcs) != 1:
+                raise ValueError(f'Could not retrieve the quantization candidate for attr {w_attr} of node {n} '
+                                 f'as it has {len(w_qcs)}!=1 unique candidates.')
             return w_qcs[0].weights_n_bits
         raise ValueError(f'Unknown mode {bitwidth_mode.name}')    # pragma: no cover

model_compression_toolkit/core/common/quantization/node_quantization_config.py CHANGED Viewed

@@ -14,7 +14,7 @@
 # ==============================================================================
-from typing import Callable, Any, List, Tuple, Union, Dict
+from typing import Callable, Any, List, Tuple, Union, Dict, TYPE_CHECKING
 import numpy as np
@@ -28,6 +28,8 @@ from model_compression_toolkit.core.common.quantization.quantization_config impo
 from model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema import AttributeQuantizationConfig, \
     OpQuantizationConfig
+if TYPE_CHECKING:
+    from model_compression_toolkit.core.common.graph.base_node import WeightAttrT
 ##########################################
 # Every node holds a quantization configuration
@@ -482,6 +484,15 @@ class NodeWeightsQuantizationConfig(BaseNodeQuantizationConfig):
         return False
+    @property
+    def all_weight_attrs(self) -> List['WeightAttrT']:
+        """ Fetch all weight attributes keys (positional and named).
+            Returns:
+                List of attributes.
+        """
+        return list(self.pos_attributes_config_mapping.keys()) + list(self.attributes_config_mapping.keys())
     def _extract_config_for_attributes_with_name(self, attr_name) -> Dict[str, WeightsAttrQuantizationConfig]:
         """
         Extract the saved attributes that contain the given attribute name.

model_compression_toolkit/core/runner.py CHANGED Viewed

@@ -229,14 +229,11 @@ def _set_final_resource_utilization(graph: Graph,
     final_ru = None
     if ru_targets:
         ru_calculator = ResourceUtilizationCalculator(graph, fw_impl, fw_info)
-        w_qcs, a_qcs = None, None
-        if ru_calculator.is_custom_weights_config_applicable(ru_targets):
-            w_qcs = {n: n.final_weights_quantization_cfg for n in graph.nodes}
-        if ru_calculator.is_custom_activation_config_applicable(ru_targets):
-            a_qcs = {n: n.final_activation_quantization_cfg for n in graph.nodes}
+        w_qcs = {n: n.final_weights_quantization_cfg for n in graph.nodes}
+        a_qcs = {n: n.final_activation_quantization_cfg for n in graph.nodes}
         final_ru = ru_calculator.compute_resource_utilization(TargetInclusionCriterion.AnyQuantized,
-                                                              BitwidthMode.QCustom,
-                                                              act_qcs=a_qcs, w_qcs=w_qcs, ru_targets=ru_targets)
+                                                              BitwidthMode.QCustom, act_qcs=a_qcs, w_qcs=w_qcs,
+                                                              ru_targets=ru_targets, allow_unused_qcs=True)
         summary = final_ru.get_summary_str(restricted=True)
         Logger.info(f'Resource utilization for quantized mixed-precision targets:\n {summary}.')
     graph.user_info.final_resource_utilization = final_ru

model_compression_toolkit/data_generation/pytorch/optimization_functions/image_initilization.py CHANGED Viewed

@@ -15,11 +15,10 @@
 from functools import partial
 from typing import Tuple, Union, List, Callable, Dict
-import cv2
 from torch import Tensor
 from torchvision.transforms.transforms import _setup_size
 import torch
-import numpy as np
+import torch.nn.functional as F
 from torch.utils.data import Dataset, DataLoader
 from model_compression_toolkit.data_generation.common.enums import DataInitType
@@ -97,9 +96,8 @@ def diverse_sample(size: Tuple[int, ...]) -> Tensor:
     sample = random_std * torch.randn(size) + random_mean
     # filtering to make the image a bit smoother
-    kernel = np.ones((5, 5), np.float32) / 16
-    if sample.shape[1] < 500 and sample.shape[2] < 500:
-        sample = torch.from_numpy(cv2.filter2D(sample.float().detach().cpu().numpy(), -1, kernel))
+    kernel = torch.ones(NUM_INPUT_CHANNELS, NUM_INPUT_CHANNELS, 5, 5) / 16
+    sample = F.conv2d(sample, kernel, padding=1)
     return sample.float()
 def default_data_init_fn(

model_compression_toolkit/logger.py CHANGED Viewed

@@ -136,7 +136,6 @@ class Logger:
             msg: Message to log.
         """
-        print(msg)
         Logger.get_logger().info(msg)
     @staticmethod
@@ -148,7 +147,6 @@ class Logger:
             msg: Message to log.
         """
-        print(msg)
         Logger.get_logger().warning(msg)
     @staticmethod

{mct_nightly-2.3.0.20250127.521.dist-info → mct_nightly-2.3.0.20250129.508.dist-info}/LICENSE.md RENAMED Viewed

File without changes

{mct_nightly-2.3.0.20250127.521.dist-info → mct_nightly-2.3.0.20250129.508.dist-info}/WHEEL RENAMED Viewed

File without changes

{mct_nightly-2.3.0.20250127.521.dist-info → mct_nightly-2.3.0.20250129.508.dist-info}/top_level.txt RENAMED Viewed

File without changes

mct-nightly 2.3.0.20250127.521__py3-none-any.whl → 2.3.0.20250129.508__py3-none-any.whl

mct-nightly 2.3.0.20250127.521__py3-none-any.whl → 2.3.0.20250129.508__py3-none-any.whl