PyPI - mct-nightly - Versions diffs - 2.1.0.20240708.453__py3-none-any.whl → 2.1.0.20240709.429__py3-none-any.whl - Mend

mct-nightly 2.1.0.20240708.453__py3-none-any.whl → 2.1.0.20240709.429__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (31) hide show

model_compression_toolkit/gptq/common/gptq_training.py CHANGED Viewed

@@ -26,8 +26,8 @@ from model_compression_toolkit.gptq.common.gptq_framework_implementation import
 from model_compression_toolkit.gptq.common.gptq_graph import get_compare_points
 from model_compression_toolkit.core.common.model_builder_mode import ModelBuilderMode
 from model_compression_toolkit.logger import Logger
-from model_compression_toolkit.core.common.hessian import HessianInfoService, TraceHessianRequest, HessianMode, \
-    HessianInfoGranularity
+from model_compression_toolkit.core.common.hessian import HessianInfoService, HessianScoresRequest, HessianMode, \
+    HessianScoresGranularity
 from model_compression_toolkit.core.common.hessian import hessian_info_utils as hessian_utils
@@ -55,7 +55,7 @@ class GPTQTrainer(ABC):
             gptq_config: GradientPTQConfig with parameters about the tuning process.
             fw_impl: Framework implementation
             fw_info: Framework information
-            hessian_info_service: HessianInfoService for fetching and computing Hessian's trace approximation.
+            hessian_info_service: HessianInfoService for fetching and computing Hessian-approximation information.
         """
         self.graph_float = copy.deepcopy(graph_float)
         self.graph_quant = copy.deepcopy(graph_quant)
@@ -132,10 +132,10 @@ class GPTQTrainer(ABC):
     def compute_hessian_based_weights(self) -> np.ndarray:
         """
-        Computes trace hessian approximations per layer w.r.t activations of the interest points.
+        Computes scores based on the hessian approximation per layer w.r.t activations of the interest points.
         Returns:
-            np.ndarray: Trace hessian approximations.
+            np.ndarray: Scores based on the hessian matrix approximation.
         """
         if not self.gptq_config.use_hessian_based_weights:
             # Return a default weight distribution based on the number of compare points
@@ -143,15 +143,15 @@ class GPTQTrainer(ABC):
             return np.asarray([1 / num_nodes for _ in range(num_nodes)])
         # Fetch hessian approximations for each target node
-        compare_point_to_trace_hessian_approximations = self._fetch_hessian_approximations()
+        compare_point_to_hessian_approx_scores = self._fetch_hessian_approximations()
         # Process the fetched hessian approximations to gather them per images
-        trace_hessian_approx_by_image = (
-            self._process_hessian_approximations(compare_point_to_trace_hessian_approximations))
+        hessian_approx_score_by_image = (
+            self._process_hessian_approximations(compare_point_to_hessian_approx_scores))
         # Check if log normalization is enabled in the configuration
         if self.gptq_config.hessian_weights_config.log_norm:
             # Calculate the mean of the approximations across images
-            mean_approx_scores = np.mean(trace_hessian_approx_by_image, axis=0)
+            mean_approx_scores = np.mean(hessian_approx_score_by_image, axis=0)
             # Reduce unnecessary dims, should remain with one dimension for the number of nodes
             mean_approx_scores = np.squeeze(mean_approx_scores)
             # Handle zero values to avoid log(0)
@@ -170,7 +170,7 @@ class GPTQTrainer(ABC):
             return log_weights - np.min(log_weights)
         else:
             # If log normalization is not enabled, return the mean of the approximations across images
-            return np.mean(trace_hessian_approx_by_image, axis=0)
+            return np.mean(hessian_approx_score_by_image, axis=0)
     def _fetch_hessian_approximations(self) -> Dict[BaseNode, List[List[float]]]:
         """
@@ -180,13 +180,13 @@ class GPTQTrainer(ABC):
             Mapping of target nodes to their hessian approximations.
         """
         approximations = {}
-        trace_hessian_request = TraceHessianRequest(
+        hessian_scores_request = HessianScoresRequest(
             mode=HessianMode.ACTIVATION,
-            granularity=HessianInfoGranularity.PER_TENSOR,
+            granularity=HessianScoresGranularity.PER_TENSOR,
             target_nodes=self.compare_points
         )
         node_approximations = self.hessian_service.fetch_hessian(
-            trace_hessian_request=trace_hessian_request,
+            hessian_scores_request=hessian_scores_request,
             required_size=self.gptq_config.hessian_weights_config.hessians_num_samples,
             batch_size=self.gptq_config.hessian_weights_config.hessian_batch_size
         )
@@ -203,21 +203,21 @@ class GPTQTrainer(ABC):
         Returns list of lists where each inner list is the approximations per image to all interest points.
         Args:
-            approximations: Hessian trace approximations mapping to process.
+            approximations: Hessian scores approximations mapping to process.
             Dictionary of Node to a list of the length of the number of images that were fetched.
         Returns:
             Processed approximations as a list of lists where each inner list is the approximations
              per image to all interest points.
         """
-        trace_hessian_approx_by_image = [[approximations[target_node][image_idx] for target_node in self.compare_points]
+        hessian_approx_score_by_image = [[approximations[target_node][image_idx] for target_node in self.compare_points]
                                          for image_idx in
                                          range(self.gptq_config.hessian_weights_config.hessians_num_samples)]
         if self.gptq_config.hessian_weights_config.norm_scores:
-            trace_hessian_approx_by_image = hessian_utils.normalize_scores(trace_hessian_approx_by_image)
+            hessian_approx_score_by_image = hessian_utils.normalize_scores(hessian_approx_score_by_image)
-        return trace_hessian_approx_by_image
+        return hessian_approx_score_by_image
     def _get_approximations_by_interest_point(self, approximations: Dict, image_idx: int) -> List:
         """
@@ -232,25 +232,25 @@ class GPTQTrainer(ABC):
         """
         approx_by_interest_point = []
         for target_node in self.compare_points:
-            trace_approx = approximations[target_node][image_idx]
-            self._validate_trace_approximation(trace_approx)
-            approx_by_interest_point.append(trace_approx[0])
+            hessian_approx_scores = approximations[target_node][image_idx]
+            self._validate_scores_approximation(hessian_approx_scores)
+            approx_by_interest_point.append(hessian_approx_scores[0])
         return approx_by_interest_point
     @staticmethod
-    def _validate_trace_approximation(trace_approx: List):
+    def _validate_scores_approximation(hessian_approx_scores: List):
         """
-        Validates the structure and length of the trace approximation.
+        Validates the structure and length of the Hessian-approximation scores.
         Args:
-            trace_approx: Trace approximation to validate.
+            hessian_approx_scores: Scores to validate.
         """
-        if not isinstance(trace_approx, list):
-            Logger.critical(f"Trace approximation was expected to be a list but is of type: {type(trace_approx)}.")   # pragma: no cover
-        if len(trace_approx) != 1:
-            Logger.critical(f"Trace approximation was expected to have a length of 1 "
+        if not isinstance(hessian_approx_scores, list):
+            Logger.critical(f"Scores approximation was expected to be a list but is of type: {type(hessian_approx_scores)}.")   # pragma: no cover
+        if len(hessian_approx_scores) != 1:
+            Logger.critical(f"Scores approximation was expected to have a length of 1 "
                             f"(for computations with granularity set to 'HessianInfoGranularity.PER_TENSOR') "
-                            f"but has a length of {len(trace_approx)}."
+                            f"but has a length of {len(hessian_approx_scores)}."
             )   # pragma: no cover
@@ -291,7 +291,7 @@ def gptq_training(graph_float: Graph,
                   representative_data_gen: Callable,
                   fw_impl: GPTQFrameworkImplemantation,
                   fw_info: FrameworkInfo,
-                  hessian_info_service: HessianInfoService=None) -> Graph:
+                  hessian_info_service: HessianInfoService = None) -> Graph:
     """
     GPTQ training process using knowledge distillation with a teacher network (float model) and a student network (quantized model).
     Args:
@@ -301,7 +301,7 @@ def gptq_training(graph_float: Graph,
         representative_data_gen: Dataset to use for inputs of the models.
         fw_impl: Framework implementation
         fw_info: Framework information
-        hessian_info_service: HessianInfoService to fetch Hessian traces approximations.
+        hessian_info_service: HessianInfoService to fetch information based on the Hessian approximation.
     Returns:
         Quantized graph for export

model_compression_toolkit/gptq/keras/gptq_training.py CHANGED Viewed

@@ -74,7 +74,7 @@ class KerasGPTQTrainer(GPTQTrainer):
             fw_impl: FrameworkImplementation object with a specific framework methods implementation.
             fw_info: Framework information.
             representative_data_gen: Dataset to use for inputs of the models.
-            hessian_info_service: HessianInfoService for fetching and computing Hessian's trace approximation.
+            hessian_info_service: HessianScoresService for fetching and computing Hessian's approximation scores.
         """
         super().__init__(graph_float,

model_compression_toolkit/gptq/pytorch/gptq_training.py CHANGED Viewed

@@ -64,7 +64,7 @@ class PytorchGPTQTrainer(GPTQTrainer):
             fw_impl: FrameworkImplementation object with a specific framework methods implementation.
             fw_info: Framework information
             representative_data_gen: Dataset to use for inputs of the models.
-            hessian_info_service: HessianInfoService to fetch approximations of the hessian traces for the float model.
+            hessian_info_service: HessianInfoService to fetch info based on the hessian approximation of the float model.
         """
         super().__init__(graph_float,
                          graph_quant,

model_compression_toolkit/gptq/runner.py CHANGED Viewed

@@ -54,7 +54,7 @@ def _apply_gptq(gptq_config: GradientPTQConfig,
         tg_bias: Graph of quantized model.
         fw_info: Information needed for quantization about the specific framework (e.g., kernel channels indices, groups of layers by how they should be quantized, etc.).
         fw_impl: Framework implementation per framework
-        hessian_info_service: HessianInfoService to fetch approximations of the hessian traces for the float model.
+        hessian_info_service: HessianInfoService to fetch information based on the hessian approximation for the float model.
     Returns:
     """
@@ -94,7 +94,7 @@ def gptq_runner(tg: Graph,
         fw_info: Information needed for quantization about the specific framework (e.g., kernel channels indices, groups of layers by how they should be quantized, etc.)
         fw_impl: FrameworkImplementation object with a specific framework methods implementation.
         tb_w: A TensorBoardWriter object initialized with the logger dir path if it was set, or None otherwise.
-        hessian_info_service: HessianInfoService to fetch approximations of the hessian traces for the float model.
+        hessian_info_service: HessianScoresService to fetch approximations of the hessian scores for the float model.
     Returns:
         A graph after model weights GPTQ fine-tuning.

model_compression_toolkit/qat/pytorch/quantization_facade.py CHANGED Viewed

@@ -153,7 +153,7 @@ if FOUND_TORCH:
         tb_w = init_tensorboard_writer(DEFAULT_PYTORCH_INFO)
         fw_impl = PytorchImplementation()
-        # Ignore trace hessian service as we do not use it here
+        # Ignore hessian scores service as we do not use it here
         tg, bit_widths_config, _ = core_runner(in_model=in_model,
                                                representative_data_gen=representative_data_gen,
                                                core_config=core_config,

{mct_nightly-2.1.0.20240708.453.dist-info → mct_nightly-2.1.0.20240709.429.dist-info}/LICENSE.md RENAMED Viewed

File without changes

{mct_nightly-2.1.0.20240708.453.dist-info → mct_nightly-2.1.0.20240709.429.dist-info}/WHEEL RENAMED Viewed

File without changes

{mct_nightly-2.1.0.20240708.453.dist-info → mct_nightly-2.1.0.20240709.429.dist-info}/top_level.txt RENAMED Viewed

File without changes

mct-nightly 2.1.0.20240708.453__py3-none-any.whl → 2.1.0.20240709.429__py3-none-any.whl

mct-nightly 2.1.0.20240708.453__py3-none-any.whl → 2.1.0.20240709.429__py3-none-any.whl