mct-nightly 2.3.0.20250511.614__tar.gz → 2.3.0.20250513.611__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/PKG-INFO +1 -1
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/mct_nightly.egg-info/PKG-INFO +1 -1
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/__init__.py +1 -1
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/framework_implementation.py +6 -33
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/mixed_precision/mixed_precision_quantization_config.py +22 -3
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/mixed_precision/mixed_precision_search_facade.py +8 -5
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/mixed_precision/mixed_precision_search_manager.py +69 -58
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/mixed_precision/sensitivity_evaluation.py +82 -79
- mct_nightly-2.3.0.20250513.611/model_compression_toolkit/core/common/mixed_precision/set_layer_to_bitwidth.py +56 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/mixed_precision/solution_refinement_procedure.py +5 -4
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/node_quantization_config.py +7 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/similarity_analyzer.py +1 -1
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/back2framework/mixed_precision_model_builder.py +37 -73
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/keras_implementation.py +8 -45
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/mixed_precision/configurable_activation_quantizer.py +7 -5
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/mixed_precision/configurable_weights_quantizer.py +6 -5
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/back2framework/mixed_precision_model_builder.py +46 -78
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/mixed_precision/configurable_activation_quantizer.py +7 -9
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/mixed_precision/configurable_weights_quantizer.py +12 -10
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/pytorch_implementation.py +6 -41
- mct_nightly-2.3.0.20250511.614/model_compression_toolkit/core/common/mixed_precision/set_layer_to_bitwidth.py +0 -50
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/LICENSE.md +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/README.md +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/mct_nightly.egg-info/SOURCES.txt +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/mct_nightly.egg-info/dependency_links.txt +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/mct_nightly.egg-info/requires.txt +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/mct_nightly.egg-info/top_level.txt +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/constants.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/analyzer.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/back2framework/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/back2framework/base_model_builder.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/base_substitutions.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/collectors/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/collectors/base_collector.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/collectors/histogram_collector.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/collectors/mean_collector.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/collectors/min_max_per_channel_collector.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/collectors/statistics_collector.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/collectors/weighted_histogram_collector.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/framework_info.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/fusion/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/fusion/fusing_info.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/fusion/graph_fuser.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/graph/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/graph/base_graph.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/graph/base_node.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/graph/edge.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/graph/functional_node.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/graph/graph_matchers.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/graph/graph_searches.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/graph/memory_graph/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/graph/memory_graph/bipartite_graph.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/graph/memory_graph/compute_graph_max_cut.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/graph/memory_graph/cut.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/graph/memory_graph/max_cut_astar.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/graph/memory_graph/memory_element.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/graph/memory_graph/memory_graph.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/graph/virtual_activation_weights_node.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/hessian/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/hessian/hessian_info_service.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/hessian/hessian_info_utils.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/hessian/hessian_scores_calculator.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/hessian/hessian_scores_request.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/matchers/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/matchers/base_graph_filter.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/matchers/base_matcher.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/matchers/edge_matcher.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/matchers/function.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/matchers/node_matcher.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/matchers/walk_matcher.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/memory_computation.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/mixed_precision/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/mixed_precision/bit_width_setter.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/mixed_precision/configurable_quant_id.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/mixed_precision/configurable_quantizer_utils.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/mixed_precision/distance_weighting.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/mixed_precision/mixed_precision_candidates_filter.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/mixed_precision/mixed_precision_ru_helper.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/mixed_precision/resource_utilization_tools/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/mixed_precision/resource_utilization_tools/resource_utilization.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/mixed_precision/resource_utilization_tools/resource_utilization_calculator.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/mixed_precision/resource_utilization_tools/resource_utilization_data.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/mixed_precision/search_methods/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/mixed_precision/search_methods/linear_programming.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/model_builder_mode.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/model_collector.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/model_validation.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/network_editors/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/network_editors/actions.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/network_editors/edit_network.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/network_editors/node_filters.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/node_prior_info.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/pruning/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/pruning/channels_grouping.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/pruning/greedy_mask_calculator.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/pruning/importance_metrics/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/pruning/importance_metrics/base_importance_metric.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/pruning/importance_metrics/importance_metric_factory.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/pruning/importance_metrics/lfh_importance_metric.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/pruning/mask/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/pruning/mask/per_channel_mask.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/pruning/mask/per_simd_group_mask.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/pruning/memory_calculator.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/pruning/prune_graph.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/pruning/pruner.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/pruning/pruning_config.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/pruning/pruning_framework_implementation.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/pruning/pruning_info.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/pruning/pruning_section.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/bit_width_config.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/candidate_node_quantization_config.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/core_config.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/debug_config.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/filter_nodes_candidates.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/quantization_config.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/quantization_fn_selection.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/quantization_params_fn_selection.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/quantization_params_generation/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/quantization_params_generation/error_functions.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/quantization_params_generation/lut_kmeans_params.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/quantization_params_generation/outlier_filter.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/quantization_params_generation/power_of_two_selection.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/quantization_params_generation/qparams_activations_computation.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/quantization_params_generation/qparams_computation.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/quantization_params_generation/qparams_search.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/quantization_params_generation/qparams_weights_computation.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/quantization_params_generation/symmetric_selection.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/quantization_params_generation/uniform_selection.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/quantize_graph_weights.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/quantize_node.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/quantizers/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/quantizers/lut_kmeans_quantizer.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/quantizers/quantizers_helpers.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/quantizers/uniform_quantizers.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/quantization/set_node_quantization_config.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/statistics_correction/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/statistics_correction/apply_activation_bias_correction_to_graph.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/statistics_correction/apply_bias_correction_to_graph.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/statistics_correction/apply_second_moment_correction_to_graph.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/statistics_correction/compute_activation_bias_correction_of_graph.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/statistics_correction/compute_bias_correction_of_graph.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/statistics_correction/statistics_correction.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/substitutions/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/substitutions/apply_substitutions.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/substitutions/batchnorm_folding.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/substitutions/batchnorm_reconstruction.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/substitutions/batchnorm_refusing.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/substitutions/linear_collapsing.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/substitutions/linear_collapsing_substitution.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/substitutions/remove_identity.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/substitutions/residual_collapsing.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/substitutions/scale_equalization.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/substitutions/shift_negative_activation.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/substitutions/softmax_shift.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/substitutions/virtual_activation_weights_composition.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/substitutions/weights_activation_split.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/user_info.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/visualization/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/visualization/final_config_visualizer.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/visualization/nn_visualizer.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/common/visualization/tensorboard_writer.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/graph_prep_runner.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/back2framework/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/back2framework/factory_model_builder.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/back2framework/float_model_builder.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/back2framework/instance_builder.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/back2framework/keras_model_builder.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/back2framework/quantized_model_builder.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/constants.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/custom_layer_validation.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/data_util.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/default_framework_info.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/graph_substitutions/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/graph_substitutions/substitutions/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/graph_substitutions/substitutions/activation_decomposition.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/graph_substitutions/substitutions/batchnorm_folding.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/graph_substitutions/substitutions/batchnorm_reconstruction.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/graph_substitutions/substitutions/batchnorm_refusing.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/graph_substitutions/substitutions/concat_threshold_update.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/graph_substitutions/substitutions/conv_funcs_to_layer.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/graph_substitutions/substitutions/dwconv_to_conv.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/graph_substitutions/substitutions/input_scaling.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/graph_substitutions/substitutions/linear_collapsing.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/graph_substitutions/substitutions/matmul_substitution.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/graph_substitutions/substitutions/multi_head_attention_decomposition.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/graph_substitutions/substitutions/relu_bound_to_power_of_2.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/graph_substitutions/substitutions/remove_identity.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/graph_substitutions/substitutions/residual_collapsing.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/graph_substitutions/substitutions/scale_equalization.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/graph_substitutions/substitutions/separableconv_decomposition.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/graph_substitutions/substitutions/shift_negative_activation.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/graph_substitutions/substitutions/sigmoid_mul_to_swish.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/graph_substitutions/substitutions/softmax_shift.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/graph_substitutions/substitutions/virtual_activation_weights_composition.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/graph_substitutions/substitutions/weights_activation_split.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/hessian/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/hessian/activation_hessian_scores_calculator_keras.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/hessian/hessian_scores_calculator_keras.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/hessian/weights_hessian_scores_calculator_keras.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/keras_model_validation.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/keras_node_prior_info.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/mixed_precision/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/pruning/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/pruning/pruning_keras_implementation.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/quantizer/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/quantizer/fake_quant_builder.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/quantizer/lut_fake_quant.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/reader/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/reader/common.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/reader/connectivity_handler.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/reader/nested_model/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/reader/nested_model/edges_merger.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/reader/nested_model/nested_model_handler.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/reader/nested_model/nodes_merger.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/reader/nested_model/outputs_merger.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/reader/node_builder.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/reader/reader.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/resource_utilization_data_facade.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/statistics_correction/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/statistics_correction/apply_second_moment_correction.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/statistics_correction/keras_compute_activation_bias_correction_of_graph.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/tf_tensor_numpy.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/keras/visualization/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/back2framework/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/back2framework/factory_model_builder.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/back2framework/float_model_builder.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/back2framework/instance_builder.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/back2framework/pytorch_model_builder.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/back2framework/quantization_wrapper/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/back2framework/quantization_wrapper/quantized_layer_wrapper.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/back2framework/quantization_wrapper/wrapper_quantize_config.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/back2framework/quantized_model_builder.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/constants.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/data_util.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/default_framework_info.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/graph_substitutions/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/batchnorm_folding.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/batchnorm_reconstruction.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/batchnorm_refusing.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/concat_threshold_update.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/const_holder_conv.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/convtranspose_dynamic_padding.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/functional_batch_norm.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/functional_layer_norm.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/functional_linear.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/linear_collapsing.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/matmul_decomposition.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/multi_head_attention_decomposition.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/relu_bound_to_power_of_2.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/remove_identity.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/reshape_with_static_shapes.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/residual_collapsing.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/scale_equalization.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/scaled_dot_product_attention.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/shift_negative_activation.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/softmax_shift.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/transform_function_call_method.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/virtual_activation_weights_composition.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/weights_activation_split.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/hessian/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/hessian/activation_hessian_scores_calculator_pytorch.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/hessian/hessian_scores_calculator_pytorch.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/hessian/weights_hessian_scores_calculator_pytorch.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/mixed_precision/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/pruning/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/pruning/pruning_pytorch_implementation.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/pytorch_device_config.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/pytorch_node_prior_info.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/quantizer/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/quantizer/fake_quant_builder.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/quantizer/lut_fake_quant.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/reader/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/reader/graph_builders.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/reader/node_holders.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/reader/reader.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/resource_utilization_data_facade.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/statistics_correction/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/statistics_correction/apply_second_moment_correction.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/statistics_correction/pytorch_compute_activation_bias_correction_of_graph.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/pytorch/utils.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/quantization_prep_runner.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/core/runner.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/common/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/common/constants.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/common/data_generation.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/common/data_generation_config.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/common/enums.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/common/image_pipeline.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/common/model_info_exctractors.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/common/optimization_utils.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/keras/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/keras/constants.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/keras/image_operations.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/keras/image_pipeline.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/keras/keras_data_generation.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/keras/model_info_exctractors.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/keras/optimization_functions/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/keras/optimization_functions/batchnorm_alignment_functions.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/keras/optimization_functions/bn_layer_weighting_functions.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/keras/optimization_functions/image_initilization.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/keras/optimization_functions/lr_scheduler.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/keras/optimization_functions/output_loss_functions.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/keras/optimization_functions/scheduler_step_functions.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/keras/optimization_utils.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/pytorch/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/pytorch/constants.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/pytorch/image_operations.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/pytorch/image_pipeline.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/pytorch/model_info_exctractors.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/pytorch/optimization_functions/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/pytorch/optimization_functions/batchnorm_alignment_functions.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/pytorch/optimization_functions/bn_layer_weighting_functions.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/pytorch/optimization_functions/image_initilization.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/pytorch/optimization_functions/lr_scheduler.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/pytorch/optimization_functions/output_loss_functions.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/pytorch/optimization_functions/scheduler_step_functions.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/pytorch/optimization_utils.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/data_generation/pytorch/pytorch_data_generation.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/defaultdict.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_exporter/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_exporter/fw_agonstic/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_exporter/fw_agonstic/exporter.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_exporter/fw_agonstic/quantization_format.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_exporter/keras/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_exporter/keras/base_keras_exporter.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_exporter/keras/export_serialization_format.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_exporter/keras/fakely_quant_keras_exporter.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_exporter/keras/fakely_quant_tflite_exporter.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_exporter/keras/int8_tflite_exporter.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_exporter/keras/keras_export_facade.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_exporter/keras/mctq_keras_exporter.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_exporter/pytorch/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_exporter/pytorch/base_pytorch_exporter.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_exporter/pytorch/export_serialization_format.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_exporter/pytorch/fakely_quant_onnx_pytorch_exporter.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_exporter/pytorch/fakely_quant_torchscript_pytorch_exporter.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_exporter/pytorch/pytorch_export_facade.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_wrapper/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_wrapper/fw_agnostic/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_wrapper/fw_agnostic/get_inferable_quantizers.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_wrapper/keras/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_wrapper/keras/builder/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_wrapper/keras/builder/fully_quantized_model_builder.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_wrapper/keras/builder/node_to_quantizer.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_wrapper/keras/validate_layer.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_wrapper/pytorch/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_wrapper/pytorch/builder/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_wrapper/pytorch/builder/fully_quantized_model_builder.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_wrapper/pytorch/builder/node_to_quantizer.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/exporter/model_wrapper/pytorch/validate_layer.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/common/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/common/gptq_config.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/common/gptq_constants.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/common/gptq_framework_implementation.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/common/gptq_graph.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/common/gptq_training.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/common/gradual_activation_quantization.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/common/regularization_factory.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/keras/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/keras/gptq_keras_implementation.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/keras/gptq_loss.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/keras/gptq_training.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/keras/graph_info.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/keras/quantization_facade.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/keras/quantizer/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/keras/quantizer/base_keras_gptq_quantizer.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/keras/quantizer/quant_utils.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/keras/quantizer/quantization_builder.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/keras/quantizer/soft_rounding/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/keras/quantizer/soft_rounding/soft_quantizer_reg.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/keras/quantizer/soft_rounding/symmetric_soft_quantizer.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/keras/quantizer/soft_rounding/uniform_soft_quantizer.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/keras/quantizer/ste_rounding/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/keras/quantizer/ste_rounding/symmetric_ste.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/pytorch/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/pytorch/gptq_loss.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/pytorch/gptq_pytorch_implementation.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/pytorch/gptq_training.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/pytorch/graph_info.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/pytorch/quantization_facade.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/pytorch/quantizer/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/pytorch/quantizer/base_pytorch_gptq_quantizer.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/pytorch/quantizer/quant_utils.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/pytorch/quantizer/quantization_builder.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/pytorch/quantizer/soft_rounding/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/pytorch/quantizer/soft_rounding/soft_quantizer_reg.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/pytorch/quantizer/soft_rounding/symmetric_soft_quantizer.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/pytorch/quantizer/soft_rounding/uniform_soft_quantizer.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/pytorch/quantizer/ste_rounding/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/pytorch/quantizer/ste_rounding/symmetric_ste.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/gptq/runner.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/logger.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/metadata.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/pruning/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/pruning/keras/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/pruning/keras/pruning_facade.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/pruning/pytorch/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/pruning/pytorch/pruning_facade.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/ptq/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/ptq/keras/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/ptq/keras/quantization_facade.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/ptq/pytorch/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/ptq/pytorch/quantization_facade.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/ptq/runner.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/qat/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/qat/common/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/qat/common/qat_config.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/qat/keras/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/qat/keras/quantization_facade.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/qat/keras/quantizer/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/qat/keras/quantizer/base_keras_qat_weight_quantizer.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/qat/keras/quantizer/lsq/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/qat/keras/quantizer/lsq/symmetric_lsq.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/qat/keras/quantizer/lsq/uniform_lsq.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/qat/keras/quantizer/quant_utils.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/qat/keras/quantizer/quantization_builder.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/qat/keras/quantizer/ste_rounding/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/qat/keras/quantizer/ste_rounding/symmetric_ste.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/qat/keras/quantizer/ste_rounding/uniform_ste.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/qat/pytorch/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/qat/pytorch/quantization_facade.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/qat/pytorch/quantizer/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/qat/pytorch/quantizer/base_pytorch_qat_weight_quantizer.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/qat/pytorch/quantizer/lsq/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/qat/pytorch/quantizer/lsq/symmetric_lsq.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/qat/pytorch/quantizer/lsq/uniform_lsq.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/qat/pytorch/quantizer/quantization_builder.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/qat/pytorch/quantizer/ste_rounding/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/qat/pytorch/quantizer/ste_rounding/symmetric_ste.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/qat/pytorch/quantizer/ste_rounding/uniform_ste.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/constants.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/immutable.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/schema/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/schema/mct_current_schema.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/schema/schema_compatability.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/schema/schema_functions.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/schema/v1.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/schema/v2.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/targetplatform2framework/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/targetplatform2framework/attach2fw.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/targetplatform2framework/attach2keras.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/targetplatform2framework/attach2pytorch.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/targetplatform2framework/attribute_filter.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/targetplatform2framework/current_tpc.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/targetplatform2framework/framework_quantization_capabilities.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/targetplatform2framework/framework_quantization_capabilities_component.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/targetplatform2framework/layer_filter_params.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/targetplatform2framework/operations_to_layers.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/tpc_io_handler.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/tpc_models/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/tpc_models/get_target_platform_capabilities.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/tpc_models/imx500_tpc/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/tpc_models/imx500_tpc/latest/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/tpc_models/imx500_tpc/v1/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/tpc_models/imx500_tpc/v1/tpc.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/tpc_models/qnnpack_tpc/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/tpc_models/qnnpack_tpc/latest/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/tpc_models/qnnpack_tpc/v1/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/tpc_models/qnnpack_tpc/v1/tpc.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/tpc_models/tflite_tpc/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/tpc_models/tflite_tpc/latest/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/tpc_models/tflite_tpc/v1/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/target_platform_capabilities/tpc_models/tflite_tpc/v1/tpc.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/common/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/common/annealing_schedulers.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/common/base_trainable_quantizer.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/common/constants.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/common/get_quantizer_config.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/common/get_quantizers.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/common/quant_utils.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/common/trainable_quantizer_config.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/common/training_method.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/common/util.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/keras/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/keras/activation_quantizers/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/keras/activation_quantizers/base_activation_quantizer.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/keras/activation_quantizers/lsq/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/keras/activation_quantizers/lsq/symmetric_lsq.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/keras/activation_quantizers/lsq/uniform_lsq.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/keras/activation_quantizers/ste/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/keras/activation_quantizers/ste/symmetric_ste.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/keras/activation_quantizers/ste/uniform_ste.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/keras/annealing_schedulers.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/keras/base_keras_quantizer.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/keras/config_serialization.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/keras/load_model.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/keras/quantize_wrapper.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/keras/quantizer_utils.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/pytorch/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/pytorch/activation_quantizers/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/pytorch/activation_quantizers/base_activation_quantizer.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/pytorch/activation_quantizers/lsq/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/pytorch/activation_quantizers/lsq/symmetric_lsq.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/pytorch/activation_quantizers/lsq/uniform_lsq.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/pytorch/activation_quantizers/ste/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/pytorch/activation_quantizers/ste/symmetric_ste.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/pytorch/activation_quantizers/ste/uniform_ste.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/pytorch/annealing_schedulers.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/pytorch/base_pytorch_quantizer.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/trainable_infrastructure/pytorch/quantizer_utils.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/verify_packages.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/xquant/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/xquant/common/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/xquant/common/constants.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/xquant/common/core_report_generator.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/xquant/common/dataset_utils.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/xquant/common/framework_report_utils.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/xquant/common/model_analyzer.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/xquant/common/model_folding_utils.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/xquant/common/similarity_calculator.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/xquant/common/similarity_functions.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/xquant/common/tensorboard_utils.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/xquant/common/xquant_config.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/xquant/keras/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/xquant/keras/dataset_utils.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/xquant/keras/facade_xquant_report.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/xquant/keras/keras_report_utils.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/xquant/keras/model_analyzer.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/xquant/keras/similarity_functions.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/xquant/keras/tensorboard_utils.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/xquant/pytorch/__init__.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/xquant/pytorch/dataset_utils.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/xquant/pytorch/facade_xquant_report.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/xquant/pytorch/model_analyzer.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/xquant/pytorch/pytorch_report_utils.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/xquant/pytorch/similarity_functions.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/model_compression_toolkit/xquant/pytorch/tensorboard_utils.py +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/setup.cfg +0 -0
- {mct_nightly-2.3.0.20250511.614 → mct_nightly-2.3.0.20250513.611}/setup.py +0 -0
@@ -27,4 +27,4 @@ from model_compression_toolkit import data_generation
|
|
27
27
|
from model_compression_toolkit import pruning
|
28
28
|
from model_compression_toolkit.trainable_infrastructure.keras.load_model import keras_load_quantized_model
|
29
29
|
|
30
|
-
__version__ = "2.3.0.20250511.000614"
|
30
|
+
__version__ = "2.3.0.20250513.000611"
|
@@ -13,24 +13,20 @@
|
|
13
13
|
# limitations under the License.
|
14
14
|
# ==============================================================================
|
15
15
|
from abc import ABC, abstractmethod
|
16
|
-
from typing import Callable, Any, List, Tuple,
|
16
|
+
from typing import Callable, Any, List, Tuple, Generator, Type
|
17
17
|
|
18
18
|
import numpy as np
|
19
19
|
|
20
20
|
from model_compression_toolkit.constants import HESSIAN_NUM_ITERATIONS
|
21
|
-
from model_compression_toolkit.core import MixedPrecisionQuantizationConfig
|
22
21
|
from model_compression_toolkit.core import common
|
23
22
|
from model_compression_toolkit.core.common import BaseNode
|
24
|
-
from model_compression_toolkit.core.common.collectors.statistics_collector import BaseStatsCollector
|
25
23
|
from model_compression_toolkit.core.common.framework_info import FrameworkInfo
|
26
24
|
from model_compression_toolkit.core.common.graph.base_graph import Graph
|
27
|
-
from model_compression_toolkit.core.common.hessian import HessianScoresRequest
|
28
|
-
from model_compression_toolkit.core.common.mixed_precision.sensitivity_evaluation import SensitivityEvaluation
|
25
|
+
from model_compression_toolkit.core.common.hessian import HessianScoresRequest
|
29
26
|
from model_compression_toolkit.core.common.model_builder_mode import ModelBuilderMode
|
30
27
|
from model_compression_toolkit.core.common.node_prior_info import NodePriorInfo
|
31
28
|
from model_compression_toolkit.core.common.quantization.core_config import CoreConfig
|
32
29
|
from model_compression_toolkit.core.common.quantization.quantization_config import QuantizationConfig
|
33
|
-
from model_compression_toolkit.core.common.user_info import UserInformation
|
34
30
|
|
35
31
|
|
36
32
|
class FrameworkImplementation(ABC):
|
@@ -38,6 +34,10 @@ class FrameworkImplementation(ABC):
|
|
38
34
|
An abstract class with abstract methods that should be implemented when supporting a new
|
39
35
|
framework in MCT.
|
40
36
|
"""
|
37
|
+
weights_quant_layer_cls: Type
|
38
|
+
activation_quant_layer_cls: Type
|
39
|
+
configurable_weights_quantizer_cls: Type
|
40
|
+
configurable_activation_quantizer_cls: Type
|
41
41
|
|
42
42
|
@property
|
43
43
|
def constants(self):
|
@@ -327,33 +327,6 @@ class FrameworkImplementation(ABC):
|
|
327
327
|
f'framework\'s get_substitutions_after_second_moment_correction '
|
328
328
|
f'method.') # pragma: no cover
|
329
329
|
|
330
|
-
@abstractmethod
|
331
|
-
def get_sensitivity_evaluator(self,
|
332
|
-
graph: Graph,
|
333
|
-
quant_config: MixedPrecisionQuantizationConfig,
|
334
|
-
representative_data_gen: Callable,
|
335
|
-
fw_info: FrameworkInfo,
|
336
|
-
hessian_info_service: HessianInfoService = None,
|
337
|
-
disable_activation_for_metric: bool = False) -> SensitivityEvaluation:
|
338
|
-
"""
|
339
|
-
Creates and returns an object which handles the computation of a sensitivity metric for a mixed-precision
|
340
|
-
configuration (comparing to the float model).
|
341
|
-
|
342
|
-
Args:
|
343
|
-
graph: Graph to build its float and mixed-precision models.
|
344
|
-
quant_config: QuantizationConfig of how the model should be quantized.
|
345
|
-
representative_data_gen: Dataset to use for retrieving images for the models inputs.
|
346
|
-
fw_info: FrameworkInfo object with information about the specific framework's model.
|
347
|
-
disable_activation_for_metric: Whether to disable activation quantization when computing the MP metric.
|
348
|
-
hessian_info_service: HessianInfoService to fetch information based on Hessian-approximation.
|
349
|
-
|
350
|
-
Returns:
|
351
|
-
A function that computes the metric.
|
352
|
-
"""
|
353
|
-
|
354
|
-
raise NotImplementedError(f'{self.__class__.__name__} has to implement the '
|
355
|
-
f'framework\'s get_sensitivity_evaluator method.') # pragma: no cover
|
356
|
-
|
357
330
|
def get_node_prior_info(self, node: BaseNode,
|
358
331
|
fw_info: FrameworkInfo,
|
359
332
|
graph: Graph) -> NodePriorInfo:
|
@@ -14,11 +14,23 @@
|
|
14
14
|
# ==============================================================================
|
15
15
|
|
16
16
|
from dataclasses import dataclass, field
|
17
|
+
from enum import Enum
|
17
18
|
from typing import List, Callable, Optional
|
18
19
|
from model_compression_toolkit.constants import MP_DEFAULT_NUM_SAMPLES, ACT_HESSIAN_DEFAULT_BATCH_SIZE
|
19
20
|
from model_compression_toolkit.core.common.mixed_precision.distance_weighting import MpDistanceWeighting
|
20
21
|
|
21
22
|
|
23
|
+
class MpMetricNormalization(Enum):
|
24
|
+
"""
|
25
|
+
MAXBIT: normalize sensitivity metrics of layer candidates by max-bitwidth candidate (of that layer).
|
26
|
+
MINBIT: normalize sensitivity metrics of layer candidates by min-bitwidth candidate (of that layer).
|
27
|
+
NONE: no normalization.
|
28
|
+
"""
|
29
|
+
MAXBIT = 'MAXBIT'
|
30
|
+
MINBIT = 'MINBIT'
|
31
|
+
NONE = 'NONE'
|
32
|
+
|
33
|
+
|
22
34
|
@dataclass
|
23
35
|
class MixedPrecisionQuantizationConfig:
|
24
36
|
"""
|
@@ -27,7 +39,6 @@ class MixedPrecisionQuantizationConfig:
|
|
27
39
|
Args:
|
28
40
|
compute_distance_fn (Callable): Function to compute a distance between two tensors. If None, using pre-defined distance methods based on the layer type for each layer.
|
29
41
|
distance_weighting_method (MpDistanceWeighting): MpDistanceWeighting enum value that provides a function to use when weighting the distances among different layers when computing the sensitivity metric.
|
30
|
-
custom_metric_fn (Callable): Function to compute a custom metric. As input gets the model_mp and returns a float value for metric. If None, uses interest point metric.
|
31
42
|
num_of_images (int): Number of images to use to evaluate the sensitivity of a mixed-precision model comparing to the float model.
|
32
43
|
configuration_overwrite (List[int]): A list of integers that enables overwrite of mixed precision with a predefined one.
|
33
44
|
num_interest_points_factor (float): A multiplication factor between zero and one (represents percentage) to reduce the number of interest points used to calculate the distance metric.
|
@@ -36,11 +47,16 @@ class MixedPrecisionQuantizationConfig:
|
|
36
47
|
refine_mp_solution (bool): Whether to try to improve the final mixed-precision configuration using a greedy algorithm that searches layers to increase their bit-width, or not.
|
37
48
|
metric_normalization_threshold (float): A threshold for checking the mixed precision distance metric values. In case of values larger than this threshold, the metric will be scaled to prevent numerical issues.
|
38
49
|
hessian_batch_size (int): The Hessian computation batch size. used only if using mixed precision with Hessian-based objective.
|
39
|
-
|
50
|
+
metric_normalization (MpMetricNormalization): Metric normalization method.
|
51
|
+
metric_epsilon (float | None): ensure minimal distance between the metric for any non-max-bitwidth candidate
|
52
|
+
and a max-bitwidth candidate, i.e. metric(non-max-bitwidth) >= metric(max-bitwidth) + epsilon.
|
53
|
+
If none, the computed metrics are used as is.
|
54
|
+
custom_metric_fn (Callable): Function to compute a custom metric. As input gets the model_mp and returns a
|
55
|
+
float value for metric. If None, uses interest point metric.
|
40
56
|
|
57
|
+
"""
|
41
58
|
compute_distance_fn: Optional[Callable] = None
|
42
59
|
distance_weighting_method: MpDistanceWeighting = MpDistanceWeighting.AVG
|
43
|
-
custom_metric_fn: Optional[Callable] = None
|
44
60
|
num_of_images: int = MP_DEFAULT_NUM_SAMPLES
|
45
61
|
configuration_overwrite: Optional[List[int]] = None
|
46
62
|
num_interest_points_factor: float = field(default=1.0, metadata={"description": "Should be between 0.0 and 1.0"})
|
@@ -49,6 +65,9 @@ class MixedPrecisionQuantizationConfig:
|
|
49
65
|
refine_mp_solution: bool = True
|
50
66
|
metric_normalization_threshold: float = 1e10
|
51
67
|
hessian_batch_size: int = ACT_HESSIAN_DEFAULT_BATCH_SIZE
|
68
|
+
metric_normalization: MpMetricNormalization = MpMetricNormalization.NONE
|
69
|
+
metric_epsilon: Optional[float] = 1e-6
|
70
|
+
custom_metric_fn: Optional[Callable] = None
|
52
71
|
_is_mixed_precision_enabled: bool = field(init=False, default=False)
|
53
72
|
|
54
73
|
def __post_init__(self):
|
@@ -25,6 +25,7 @@ from model_compression_toolkit.core.common.mixed_precision.mixed_precision_searc
|
|
25
25
|
MixedPrecisionSearchManager
|
26
26
|
from model_compression_toolkit.core.common.mixed_precision.resource_utilization_tools.resource_utilization import \
|
27
27
|
ResourceUtilization
|
28
|
+
from model_compression_toolkit.core.common.mixed_precision.sensitivity_evaluation import SensitivityEvaluation
|
28
29
|
from model_compression_toolkit.core.common.mixed_precision.solution_refinement_procedure import \
|
29
30
|
greedy_solution_refinement_procedure
|
30
31
|
|
@@ -78,11 +79,12 @@ def search_bit_width(graph: Graph,
|
|
78
79
|
|
79
80
|
# Set Sensitivity Evaluator for MP search. It should always work with the original MP graph,
|
80
81
|
# even if a virtual graph was created (and is used only for BOPS utilization computation purposes)
|
81
|
-
se = fw_impl.get_sensitivity_evaluator(
|
82
|
+
se = SensitivityEvaluation(
|
82
83
|
graph,
|
83
84
|
mp_config,
|
84
85
|
representative_data_gen=representative_data_gen,
|
85
86
|
fw_info=fw_info,
|
87
|
+
fw_impl=fw_impl,
|
86
88
|
disable_activation_for_metric=disable_activation_for_metric,
|
87
89
|
hessian_info_service=hessian_info_service)
|
88
90
|
|
@@ -96,10 +98,11 @@ def search_bit_width(graph: Graph,
|
|
96
98
|
|
97
99
|
# Search manager and LP are highly coupled, so LP search method was moved inside search manager.
|
98
100
|
search_manager = MixedPrecisionSearchManager(graph,
|
99
|
-
fw_info,
|
100
|
-
fw_impl,
|
101
|
-
se,
|
102
|
-
target_resource_utilization
|
101
|
+
fw_info=fw_info,
|
102
|
+
fw_impl=fw_impl,
|
103
|
+
sensitivity_evaluator=se,
|
104
|
+
target_resource_utilization=target_resource_utilization,
|
105
|
+
mp_config=mp_config)
|
103
106
|
nodes_bit_cfg = search_manager.search()
|
104
107
|
|
105
108
|
graph.skip_validation_check = False
|
@@ -12,6 +12,8 @@
|
|
12
12
|
# See the License for the specific language governing permissions and
|
13
13
|
# limitations under the License.
|
14
14
|
# ==============================================================================
|
15
|
+
import os
|
16
|
+
|
15
17
|
import itertools
|
16
18
|
|
17
19
|
import copy
|
@@ -19,7 +21,7 @@ from collections import defaultdict
|
|
19
21
|
|
20
22
|
from tqdm import tqdm
|
21
23
|
|
22
|
-
from typing import Dict, List, Tuple, Optional
|
24
|
+
from typing import Dict, List, Tuple, Optional, Set
|
23
25
|
|
24
26
|
import numpy as np
|
25
27
|
|
@@ -40,6 +42,8 @@ from model_compression_toolkit.core.common.mixed_precision.search_methods.linear
|
|
40
42
|
from model_compression_toolkit.core.common.mixed_precision.sensitivity_evaluation import SensitivityEvaluation
|
41
43
|
from model_compression_toolkit.core.common.substitutions.apply_substitutions import substitute
|
42
44
|
from model_compression_toolkit.logger import Logger
|
45
|
+
from model_compression_toolkit.core.common.mixed_precision.mixed_precision_quantization_config import \
|
46
|
+
MixedPrecisionQuantizationConfig, MpMetricNormalization
|
43
47
|
|
44
48
|
|
45
49
|
class MixedPrecisionSearchManager:
|
@@ -52,7 +56,8 @@ class MixedPrecisionSearchManager:
|
|
52
56
|
fw_info: FrameworkInfo,
|
53
57
|
fw_impl: FrameworkImplementation,
|
54
58
|
sensitivity_evaluator: SensitivityEvaluation,
|
55
|
-
target_resource_utilization: ResourceUtilization
|
59
|
+
target_resource_utilization: ResourceUtilization,
|
60
|
+
mp_config: MixedPrecisionQuantizationConfig):
|
56
61
|
"""
|
57
62
|
|
58
63
|
Args:
|
@@ -74,21 +79,21 @@ class MixedPrecisionSearchManager:
|
|
74
79
|
|
75
80
|
self.sensitivity_evaluator = sensitivity_evaluator
|
76
81
|
self.target_resource_utilization = target_resource_utilization
|
82
|
+
self.mp_config = mp_config
|
77
83
|
|
78
84
|
self.mp_topo_configurable_nodes = self.mp_graph.get_configurable_sorted_nodes(fw_info)
|
79
85
|
|
80
86
|
self.ru_targets = target_resource_utilization.get_restricted_targets()
|
81
|
-
self.
|
87
|
+
self.orig_graph_ru_helper = MixedPrecisionRUHelper(self.original_graph, fw_info, fw_impl)
|
82
88
|
|
83
89
|
self.min_ru_config: Dict[BaseNode, int] = self.mp_graph.get_min_candidates_config(fw_info)
|
84
|
-
self.max_ru_config: Dict[BaseNode, int] = self.mp_graph.get_max_candidates_config(fw_info)
|
85
90
|
|
86
|
-
self.
|
91
|
+
self.config_reconstructor = None
|
92
|
+
orig_min_config = self.min_ru_config
|
87
93
|
if self.using_virtual_graph:
|
88
|
-
|
89
|
-
|
90
|
-
|
91
|
-
self.min_ru = self.ru_helper.compute_utilization(self.ru_targets, self.min_ru_config)
|
94
|
+
self.config_reconstructor = ConfigReconstructionHelper(self.original_graph)
|
95
|
+
orig_min_config = self.config_reconstructor.reconstruct_full_configuration(self.min_ru_config)
|
96
|
+
self.min_ru = self.orig_graph_ru_helper.compute_utilization(self.ru_targets, orig_min_config)
|
92
97
|
|
93
98
|
def search(self) -> Dict[BaseNode, int]:
|
94
99
|
"""
|
@@ -100,7 +105,7 @@ class MixedPrecisionSearchManager:
|
|
100
105
|
mp_config = self._prepare_and_run_solver()
|
101
106
|
|
102
107
|
if self.using_virtual_graph:
|
103
|
-
mp_config = self.config_reconstruction_helper.reconstruct_full_configuration(mp_config)
|
108
|
+
mp_config = self.config_reconstructor.reconstruct_full_configuration(mp_config)
|
104
109
|
|
105
110
|
return mp_config
|
106
111
|
|
@@ -143,61 +148,64 @@ class MixedPrecisionSearchManager:
|
|
143
148
|
f"following targets: {unsatisfiable_targets}")
|
144
149
|
return rel_target_ru
|
145
150
|
|
146
|
-
def _build_sensitivity_mapping(self
|
151
|
+
def _build_sensitivity_mapping(self) -> Dict[BaseNode, List[float]]:
|
147
152
|
"""
|
148
153
|
This function measures the sensitivity of a change in a bitwidth of a layer on the entire model.
|
149
154
|
|
150
|
-
Args:
|
151
|
-
eps: if sensitivity for a non-max candidate is lower than for a max candidate, we set it to
|
152
|
-
sensitivity of a max candidate + epsilon.
|
153
|
-
|
154
155
|
Returns:
|
155
156
|
Mapping from nodes to their bitwidth candidates sensitivity.
|
156
157
|
"""
|
157
|
-
|
158
158
|
Logger.info('Starting to evaluate metrics')
|
159
|
-
|
160
|
-
|
161
|
-
|
162
|
-
|
163
|
-
|
164
|
-
|
165
|
-
|
166
|
-
|
167
|
-
|
168
|
-
|
169
|
-
|
170
|
-
|
171
|
-
|
172
|
-
|
173
|
-
|
174
|
-
|
175
|
-
|
176
|
-
|
159
|
+
norm_method = self.mp_config.metric_normalization
|
160
|
+
eps = self.mp_config.metric_epsilon
|
161
|
+
|
162
|
+
verbose = 'VERBOSE_MP_METRIC' in os.environ
|
163
|
+
|
164
|
+
def normalize(node_candidates_metrics, max_ind):
|
165
|
+
if norm_method == MpMetricNormalization.NONE:
|
166
|
+
return node_candidates_metrics
|
167
|
+
if norm_method == MpMetricNormalization.MAXBIT:
|
168
|
+
ref_ind = max_ind
|
169
|
+
elif norm_method == MpMetricNormalization.MINBIT:
|
170
|
+
ref_ind = node.find_min_candidate_index()
|
171
|
+
else: # pragma: no cover
|
172
|
+
raise ValueError(f'Unexpected MpMetricNormalization mode {norm_method}')
|
173
|
+
normalized_metrics = node_candidates_metrics / node_candidates_metrics[ref_ind]
|
174
|
+
if verbose and not np.array_equal(normalized_metrics, node_candidates_metrics):
|
175
|
+
print(f'{"normalized metric:":25}', candidates_sensitivity)
|
176
|
+
return normalized_metrics
|
177
|
+
|
178
|
+
def ensure_maxbit_minimal_metric(node_candidates_metrics, max_ind):
    """
    Make the candidate at ``max_ind`` the one with the smallest metric.

    Every candidate whose metric is below ``metric(max_ind) + eps`` is raised to that value, while
    the candidate at ``max_ind`` keeps its own metric. ``eps`` is read from the enclosing scope;
    when it is None the adjustment is disabled.

    Args:
        node_candidates_metrics: Array with one metric value per candidate of the current node.
        max_ind: Index of the max-bit candidate.

    Returns:
        The input array itself when ``eps`` is None, otherwise a new adjusted array
        (the input is not modified).
    """
    if eps is None:
        return node_candidates_metrics
    # We want maxbit configuration to have the minimal distance metric (so that optimization objective
    # doesn't prefer lower bits). If we got a smaller metric for non-maxbit, we update it to metric(maxbit)+eps.
    max_val = node_candidates_metrics[max_ind]
    metrics = np.maximum(node_candidates_metrics, max_val + eps)
    # np.maximum also lifted the max-bit entry itself to max_val + eps; restore its true value.
    metrics[max_ind] = max_val
    if verbose and not np.array_equal(metrics, node_candidates_metrics):
        # Log the adjusted values computed here rather than the pre-adjustment input.
        print(f'{"eps-adjusted metric:":25}', metrics)
    return metrics
|
177
189
|
|
178
190
|
layer_to_metrics_mapping = defaultdict(list)
|
179
191
|
for node_idx, node in tqdm(enumerate(self.mp_topo_configurable_nodes)):
|
192
|
+
candidates_sensitivity = np.empty(len(node.candidates_quantization_cfg))
|
180
193
|
for bitwidth_idx, _ in enumerate(node.candidates_quantization_cfg):
|
181
|
-
if self.max_ru_config[node] == bitwidth_idx:
|
182
|
-
# This is a computation of the metric for the max configuration, assign pre-calculated value
|
183
|
-
layer_to_metrics_mapping[node].append(max_config_value)
|
184
|
-
continue
|
185
|
-
|
186
|
-
# Create a configuration that differs at one layer only from the baseline model
|
187
|
-
mp_model_configuration = self.max_ru_config.copy()
|
188
|
-
mp_model_configuration[node] = bitwidth_idx
|
189
|
-
|
190
|
-
# Build a distance matrix using the function we got from the framework implementation.
|
191
194
|
if self.using_virtual_graph:
|
192
|
-
|
193
|
-
orig_mp_config = self.config_reconstruction_helper.reconstruct_full_configuration(mp_model_configuration)
|
194
|
-
changed_nodes = [orig_sorted_nodes.index(n) for n, ind in orig_mp_config.items()
|
195
|
-
if origin_max_config[n] != ind]
|
196
|
-
metric_value = compute_metric(orig_mp_config, changed_nodes, origin_max_config)
|
195
|
+
a_cfg, w_cfg = self.config_reconstructor.reconstruct_separate_aw_configs({node: bitwidth_idx})
|
197
196
|
else:
|
198
|
-
|
199
|
-
|
200
|
-
|
197
|
+
a_cfg = {node: bitwidth_idx} if node.has_configurable_activation() else {}
|
198
|
+
w_cfg = {node: bitwidth_idx} if node.has_any_configurable_weight() else {}
|
199
|
+
candidates_sensitivity[bitwidth_idx] = self.sensitivity_evaluator.compute_metric(
|
200
|
+
mp_a_cfg={n.name: ind for n, ind in a_cfg.items()},
|
201
|
+
mp_w_cfg={n.name: ind for n, ind in w_cfg.items()}
|
202
|
+
)
|
203
|
+
if verbose:
|
204
|
+
print(f'{node.name}\n{"raw metric:":25}', candidates_sensitivity)
|
205
|
+
max_ind = node.find_max_candidate_index()
|
206
|
+
candidates_sensitivity = normalize(candidates_sensitivity, max_ind)
|
207
|
+
candidates_sensitivity = ensure_maxbit_minimal_metric(candidates_sensitivity, max_ind)
|
208
|
+
layer_to_metrics_mapping[node] = candidates_sensitivity
|
201
209
|
|
202
210
|
# Finalize distance metric mapping
|
203
211
|
self._finalize_distance_metric(layer_to_metrics_mapping)
|
@@ -244,8 +252,9 @@ class MixedPrecisionSearchManager:
|
|
244
252
|
else:
|
245
253
|
cfg = self.min_ru_config.copy()
|
246
254
|
cfg[node] = candidate_idx
|
247
|
-
|
248
|
-
|
255
|
+
if self.using_virtual_graph:
|
256
|
+
cfg = self.config_reconstructor.reconstruct_full_configuration(cfg)
|
257
|
+
candidate_rus = self.orig_graph_ru_helper.compute_utilization(self.ru_targets, cfg)
|
249
258
|
|
250
259
|
for target, ru in candidate_rus.items():
|
251
260
|
rus_per_candidate[target].append(ru)
|
@@ -283,8 +292,8 @@ class MixedPrecisionSearchManager:
|
|
283
292
|
with the given config.
|
284
293
|
|
285
294
|
"""
|
286
|
-
act_qcs, w_qcs = self.
|
287
|
-
ru = self.
|
295
|
+
act_qcs, w_qcs = self.orig_graph_ru_helper.get_quantization_candidates(config)
|
296
|
+
ru = self.orig_graph_ru_helper.ru_calculator.compute_resource_utilization(
|
288
297
|
target_criterion=TargetInclusionCriterion.AnyQuantized, bitwidth_mode=BitwidthMode.QCustom, act_qcs=act_qcs,
|
289
298
|
w_qcs=w_qcs, ru_targets=self.ru_targets, allow_unused_qcs=True)
|
290
299
|
return ru
|
@@ -303,7 +312,7 @@ class MixedPrecisionSearchManager:
|
|
303
312
|
# normalize metric for numerical stability
|
304
313
|
max_dist = max(itertools.chain.from_iterable(layer_to_metrics_mapping.values()))
|
305
314
|
|
306
|
-
if max_dist >= self.
|
315
|
+
if max_dist >= self.mp_config.metric_normalization_threshold:
|
307
316
|
Logger.warning(f"The mixed precision distance metric values indicate a large error in the quantized model."
|
308
317
|
f"this can cause numerical issues."
|
309
318
|
f"The program will proceed with mixed precision search after scaling the metric values,"
|
@@ -387,7 +396,9 @@ class ConfigReconstructionHelper:
|
|
387
396
|
|
388
397
|
return orig_cfg
|
389
398
|
|
390
|
-
def reconstruct_separate_aw_configs(self,
|
399
|
+
def reconstruct_separate_aw_configs(self,
|
400
|
+
virtual_cfg: Dict[BaseNode, int],
|
401
|
+
include_non_configurable: bool = False) \
|
391
402
|
-> Tuple[Dict[BaseNode, int], Dict[BaseNode, int]]:
|
392
403
|
"""
|
393
404
|
Retrieves original activation and weights nodes and corresponding candidates for a given configuration of the
|