mct-nightly 1.8.0.22042023.post414__py3-none-any.whl → 1.8.0.22052023.post408__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (238) hide show
  1. {mct_nightly-1.8.0.22042023.post414.dist-info → mct_nightly-1.8.0.22052023.post408.dist-info}/METADATA +1 -1
  2. {mct_nightly-1.8.0.22042023.post414.dist-info → mct_nightly-1.8.0.22052023.post408.dist-info}/RECORD +237 -230
  3. model_compression_toolkit/__init__.py +8 -31
  4. model_compression_toolkit/{core/common/constants.py → constants.py} +2 -6
  5. model_compression_toolkit/core/__init__.py +14 -0
  6. model_compression_toolkit/core/analyzer.py +3 -2
  7. model_compression_toolkit/core/common/__init__.py +0 -1
  8. model_compression_toolkit/core/common/collectors/base_collector.py +1 -1
  9. model_compression_toolkit/core/common/collectors/mean_collector.py +1 -1
  10. model_compression_toolkit/core/common/collectors/min_max_per_channel_collector.py +1 -1
  11. model_compression_toolkit/core/common/framework_implementation.py +1 -8
  12. model_compression_toolkit/core/common/fusion/layer_fusing.py +2 -2
  13. model_compression_toolkit/core/common/graph/base_graph.py +1 -1
  14. model_compression_toolkit/core/common/graph/base_node.py +57 -1
  15. model_compression_toolkit/core/common/graph/memory_graph/bipartite_graph.py +1 -1
  16. model_compression_toolkit/core/common/graph/memory_graph/max_cut_astar.py +1 -1
  17. model_compression_toolkit/core/common/graph/virtual_activation_weights_node.py +2 -2
  18. model_compression_toolkit/core/common/memory_computation.py +1 -1
  19. model_compression_toolkit/core/common/mixed_precision/bit_width_setter.py +1 -1
  20. model_compression_toolkit/core/common/mixed_precision/kpi_tools/kpi_data.py +2 -3
  21. model_compression_toolkit/core/common/mixed_precision/kpi_tools/kpi_methods.py +3 -3
  22. model_compression_toolkit/core/common/mixed_precision/mixed_precision_quantization_config.py +1 -1
  23. model_compression_toolkit/core/common/mixed_precision/mixed_precision_search_facade.py +3 -2
  24. model_compression_toolkit/core/common/mixed_precision/mixed_precision_search_manager.py +1 -1
  25. model_compression_toolkit/core/common/mixed_precision/search_methods/linear_programming.py +1 -1
  26. model_compression_toolkit/core/common/mixed_precision/sensitivity_evaluation.py +2 -2
  27. model_compression_toolkit/core/common/mixed_precision/solution_refinement_procedure.py +2 -2
  28. model_compression_toolkit/core/common/model_collector.py +2 -2
  29. model_compression_toolkit/core/common/model_validation.py +1 -1
  30. model_compression_toolkit/core/common/network_editors/actions.py +4 -1
  31. model_compression_toolkit/core/common/quantization/candidate_node_quantization_config.py +1 -1
  32. model_compression_toolkit/core/common/quantization/filter_nodes_candidates.py +1 -1
  33. model_compression_toolkit/core/common/quantization/node_quantization_config.py +1 -1
  34. model_compression_toolkit/core/common/quantization/quantization_config.py +2 -2
  35. model_compression_toolkit/core/common/quantization/quantization_params_fn_selection.py +1 -1
  36. model_compression_toolkit/core/common/quantization/quantization_params_generation/error_functions.py +1 -1
  37. model_compression_toolkit/core/common/quantization/quantization_params_generation/kmeans_params.py +1 -1
  38. model_compression_toolkit/core/common/quantization/quantization_params_generation/lut_kmeans_params.py +2 -2
  39. model_compression_toolkit/core/common/quantization/quantization_params_generation/power_of_two_selection.py +1 -1
  40. model_compression_toolkit/core/common/quantization/quantization_params_generation/qparams_activations_computation.py +2 -2
  41. model_compression_toolkit/core/common/quantization/quantization_params_generation/qparams_computation.py +1 -1
  42. model_compression_toolkit/core/common/quantization/quantization_params_generation/qparams_search.py +1 -1
  43. model_compression_toolkit/core/common/quantization/quantization_params_generation/qparams_weights_computation.py +1 -1
  44. model_compression_toolkit/core/common/quantization/quantization_params_generation/symmetric_selection.py +1 -1
  45. model_compression_toolkit/core/common/quantization/quantization_params_generation/uniform_selection.py +1 -1
  46. model_compression_toolkit/core/common/quantization/quantize_graph_weights.py +2 -1
  47. model_compression_toolkit/core/common/quantization/quantize_node.py +2 -2
  48. model_compression_toolkit/core/common/quantization/quantizers/kmeans_quantizer.py +1 -1
  49. model_compression_toolkit/core/common/quantization/quantizers/lut_kmeans_quantizer.py +1 -1
  50. model_compression_toolkit/core/common/quantization/quantizers/quantizers_helpers.py +4 -2
  51. model_compression_toolkit/core/common/quantization/quantizers/uniform_quantizers.py +2 -2
  52. model_compression_toolkit/core/common/quantization/set_node_quantization_config.py +3 -2
  53. model_compression_toolkit/core/common/similarity_analyzer.py +2 -2
  54. model_compression_toolkit/core/common/statistics_correction/apply_bias_correction_to_graph.py +4 -3
  55. model_compression_toolkit/core/common/statistics_correction/compute_bias_correction_of_graph.py +3 -2
  56. model_compression_toolkit/core/common/substitutions/batchnorm_reconstruction.py +1 -1
  57. model_compression_toolkit/core/common/substitutions/batchnorm_refusing.py +2 -2
  58. model_compression_toolkit/core/common/substitutions/linear_collapsing.py +1 -1
  59. model_compression_toolkit/core/common/substitutions/shift_negative_activation.py +4 -4
  60. model_compression_toolkit/core/common/substitutions/virtual_activation_weights_composition.py +1 -1
  61. model_compression_toolkit/core/common/substitutions/weights_activation_split.py +1 -1
  62. model_compression_toolkit/core/common/visualization/tensorboard_writer.py +1 -1
  63. model_compression_toolkit/core/keras/back2framework/factory_model_builder.py +1 -1
  64. model_compression_toolkit/core/keras/back2framework/float_model_builder.py +1 -1
  65. model_compression_toolkit/core/keras/back2framework/keras_model_builder.py +66 -21
  66. model_compression_toolkit/core/keras/back2framework/mixed_precision_model_builder.py +1 -1
  67. model_compression_toolkit/core/keras/back2framework/model_gradients.py +2 -2
  68. model_compression_toolkit/core/keras/back2framework/quantized_model_builder.py +1 -1
  69. model_compression_toolkit/core/keras/constants.py +0 -7
  70. model_compression_toolkit/core/keras/default_framework_info.py +2 -2
  71. model_compression_toolkit/core/keras/graph_substitutions/substitutions/activation_decomposition.py +1 -1
  72. model_compression_toolkit/core/keras/graph_substitutions/substitutions/input_scaling.py +1 -1
  73. model_compression_toolkit/core/keras/graph_substitutions/substitutions/linear_collapsing.py +1 -1
  74. model_compression_toolkit/core/keras/graph_substitutions/substitutions/multi_head_attention_decomposition.py +3 -4
  75. model_compression_toolkit/core/keras/graph_substitutions/substitutions/relu_bound_to_power_of_2.py +2 -1
  76. model_compression_toolkit/core/keras/graph_substitutions/substitutions/remove_relu_upper_bound.py +3 -2
  77. model_compression_toolkit/core/keras/graph_substitutions/substitutions/residual_collapsing.py +1 -1
  78. model_compression_toolkit/core/keras/graph_substitutions/substitutions/shift_negative_activation.py +1 -1
  79. model_compression_toolkit/core/keras/keras_implementation.py +2 -10
  80. model_compression_toolkit/core/keras/keras_model_validation.py +1 -1
  81. model_compression_toolkit/core/keras/keras_node_prior_info.py +1 -1
  82. model_compression_toolkit/core/keras/kpi_data_facade.py +7 -7
  83. model_compression_toolkit/core/keras/quantizer/fake_quant_builder.py +2 -2
  84. model_compression_toolkit/core/keras/quantizer/input_layer_quantize_transform.py +1 -1
  85. model_compression_toolkit/core/keras/quantizer/lut_fake_quant.py +2 -2
  86. model_compression_toolkit/core/keras/quantizer/mixed_precision/selective_quantize_config.py +1 -1
  87. model_compression_toolkit/core/keras/reader/common.py +1 -1
  88. model_compression_toolkit/core/keras/statistics_correction/apply_second_moment_correction.py +1 -1
  89. model_compression_toolkit/core/pytorch/back2framework/factory_model_builder.py +1 -1
  90. model_compression_toolkit/core/pytorch/back2framework/float_model_builder.py +1 -1
  91. model_compression_toolkit/core/pytorch/back2framework/mixed_precision_model_builder.py +1 -1
  92. model_compression_toolkit/core/pytorch/back2framework/model_gradients.py +2 -2
  93. model_compression_toolkit/core/pytorch/back2framework/pytorch_model_builder.py +1 -1
  94. model_compression_toolkit/core/pytorch/back2framework/quantized_model_builder.py +1 -1
  95. model_compression_toolkit/core/pytorch/constants.py +0 -6
  96. model_compression_toolkit/core/pytorch/default_framework_info.py +1 -1
  97. model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/linear_collapsing.py +1 -1
  98. model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/multi_head_attention_decomposition.py +1 -1
  99. model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/relu_bound_to_power_of_2.py +3 -2
  100. model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/reshape_with_static_shapes.py +1 -1
  101. model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/residual_collapsing.py +1 -1
  102. model_compression_toolkit/core/pytorch/graph_substitutions/substitutions/shift_negative_activation.py +1 -1
  103. model_compression_toolkit/core/pytorch/kpi_data_facade.py +6 -6
  104. model_compression_toolkit/core/pytorch/mixed_precision/mixed_precision_wrapper.py +1 -1
  105. model_compression_toolkit/core/pytorch/pytorch_implementation.py +1 -9
  106. model_compression_toolkit/core/pytorch/pytorch_node_prior_info.py +1 -1
  107. model_compression_toolkit/core/pytorch/quantizer/fake_quant_builder.py +2 -2
  108. model_compression_toolkit/core/pytorch/quantizer/lut_fake_quant.py +1 -1
  109. model_compression_toolkit/core/pytorch/reader/graph_builders.py +3 -2
  110. model_compression_toolkit/core/pytorch/statistics_correction/apply_second_moment_correction.py +1 -1
  111. model_compression_toolkit/core/runner.py +6 -6
  112. model_compression_toolkit/exporter/__init__.py +6 -3
  113. model_compression_toolkit/exporter/model_exporter/fw_agonstic/exporter.py +1 -1
  114. model_compression_toolkit/exporter/model_exporter/keras/export_serialization_format.py +20 -0
  115. model_compression_toolkit/exporter/model_exporter/keras/fakely_quant_keras_exporter.py +1 -1
  116. model_compression_toolkit/exporter/model_exporter/{tflite → keras}/fakely_quant_tflite_exporter.py +1 -1
  117. model_compression_toolkit/exporter/model_exporter/{tflite → keras}/int8_tflite_exporter.py +1 -1
  118. model_compression_toolkit/exporter/model_exporter/keras/keras_export_facade.py +60 -22
  119. model_compression_toolkit/exporter/model_exporter/pytorch/export_serialization_format.py +20 -0
  120. model_compression_toolkit/exporter/model_exporter/pytorch/fakely_quant_onnx_pytorch_exporter.py +15 -1
  121. model_compression_toolkit/exporter/model_exporter/pytorch/fakely_quant_torchscript_pytorch_exporter.py +1 -1
  122. model_compression_toolkit/exporter/model_exporter/pytorch/pytorch_export_facade.py +54 -31
  123. model_compression_toolkit/exporter/model_wrapper/keras/builder/fully_quantized_model_builder.py +5 -3
  124. model_compression_toolkit/exporter/model_wrapper/keras/builder/node_to_quantizer.py +4 -2
  125. model_compression_toolkit/exporter/model_wrapper/keras/validate_layer.py +2 -2
  126. model_compression_toolkit/exporter/model_wrapper/pytorch/builder/fully_quantized_model_builder.py +3 -2
  127. model_compression_toolkit/exporter/model_wrapper/pytorch/builder/node_to_quantizer.py +3 -2
  128. model_compression_toolkit/exporter/model_wrapper/pytorch/validate_layer.py +2 -2
  129. model_compression_toolkit/gptq/common/gptq_framework_implementation.py +32 -0
  130. model_compression_toolkit/gptq/common/gptq_graph.py +2 -2
  131. model_compression_toolkit/gptq/common/gptq_training.py +5 -4
  132. model_compression_toolkit/gptq/keras/gptq_keras_implementation.py +29 -0
  133. model_compression_toolkit/gptq/keras/gptq_training.py +41 -14
  134. model_compression_toolkit/gptq/keras/graph_info.py +4 -0
  135. model_compression_toolkit/gptq/keras/quantization_facade.py +26 -19
  136. model_compression_toolkit/gptq/keras/quantizer/base_keras_gptq_quantizer.py +2 -2
  137. model_compression_toolkit/gptq/keras/quantizer/quant_utils.py +1 -1
  138. model_compression_toolkit/gptq/keras/quantizer/soft_rounding/symmetric_soft_quantizer.py +1 -1
  139. model_compression_toolkit/gptq/keras/quantizer/soft_rounding/uniform_soft_quantizer.py +2 -2
  140. model_compression_toolkit/gptq/keras/quantizer/ste_rounding/symmetric_ste.py +1 -1
  141. model_compression_toolkit/gptq/pytorch/gptq_pytorch_implementation.py +29 -0
  142. model_compression_toolkit/gptq/pytorch/gptq_training.py +1 -1
  143. model_compression_toolkit/gptq/pytorch/quantization_facade.py +11 -11
  144. model_compression_toolkit/gptq/pytorch/quantizer/base_pytorch_gptq_quantizer.py +3 -3
  145. model_compression_toolkit/gptq/pytorch/quantizer/quant_utils.py +1 -3
  146. model_compression_toolkit/gptq/pytorch/quantizer/soft_rounding/symmetric_soft_quantizer.py +1 -1
  147. model_compression_toolkit/gptq/pytorch/quantizer/soft_rounding/uniform_soft_quantizer.py +2 -2
  148. model_compression_toolkit/gptq/pytorch/quantizer/ste_rounding/symmetric_ste.py +1 -1
  149. model_compression_toolkit/gptq/runner.py +3 -2
  150. model_compression_toolkit/{exporter/model_exporter/tflite → legacy}/__init__.py +1 -1
  151. model_compression_toolkit/{core/keras/quantization_facade.py → legacy/keras_quantization_facade.py} +8 -9
  152. model_compression_toolkit/{core/pytorch/quantization_facade.py → legacy/pytorch_quantization_facade.py} +8 -9
  153. model_compression_toolkit/ptq/__init__.py +3 -0
  154. model_compression_toolkit/ptq/keras/quantization_facade.py +10 -11
  155. model_compression_toolkit/ptq/pytorch/quantization_facade.py +7 -7
  156. model_compression_toolkit/qat/__init__.py +4 -0
  157. model_compression_toolkit/qat/common/__init__.py +1 -2
  158. model_compression_toolkit/qat/common/qat_config.py +5 -1
  159. model_compression_toolkit/qat/keras/quantization_facade.py +33 -27
  160. model_compression_toolkit/qat/keras/quantizer/base_keras_qat_quantizer.py +2 -2
  161. model_compression_toolkit/qat/keras/quantizer/quantization_builder.py +31 -4
  162. model_compression_toolkit/qat/keras/quantizer/ste_rounding/symmetric_ste.py +12 -10
  163. model_compression_toolkit/qat/keras/quantizer/ste_rounding/uniform_ste.py +8 -8
  164. model_compression_toolkit/qat/pytorch/quantization_facade.py +8 -8
  165. model_compression_toolkit/qat/pytorch/quantizer/base_pytorch_qat_quantizer.py +2 -2
  166. model_compression_toolkit/qat/pytorch/quantizer/ste_rounding/symmetric_ste.py +3 -2
  167. model_compression_toolkit/qat/pytorch/quantizer/ste_rounding/uniform_ste.py +6 -4
  168. model_compression_toolkit/quantizers_infrastructure/__init__.py +2 -2
  169. model_compression_toolkit/{qat/common → quantizers_infrastructure}/constants.py +2 -1
  170. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/common/constants.py +5 -0
  171. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/common/get_quantizers.py +1 -1
  172. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/keras/activation_quantization_holder.py +147 -0
  173. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/keras/load_model.py +5 -5
  174. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/keras/quantize_wrapper.py +2 -2
  175. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/keras/quantizers/activation_inferable_quantizers/activation_lut_pot_inferable_quantizer.py +2 -2
  176. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/keras/quantizers/activation_inferable_quantizers/activation_pot_inferable_quantizer.py +2 -2
  177. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/keras/quantizers/activation_inferable_quantizers/activation_symmetric_inferable_quantizer.py +1 -1
  178. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/keras/quantizers/activation_inferable_quantizers/activation_uniform_inferable_quantizer.py +2 -2
  179. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/keras/quantizers/base_keras_inferable_quantizer.py +1 -1
  180. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/keras/quantizers/weights_inferable_quantizers/weights_lut_pot_inferable_quantizer.py +1 -1
  181. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/keras/quantizers/weights_inferable_quantizers/weights_lut_symmetric_inferable_quantizer.py +1 -1
  182. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/keras/quantizers/weights_inferable_quantizers/weights_pot_inferable_quantizer.py +1 -1
  183. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/keras/quantizers/weights_inferable_quantizers/weights_symmetric_inferable_quantizer.py +1 -1
  184. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/keras/quantizers/weights_inferable_quantizers/weights_uniform_inferable_quantizer.py +1 -1
  185. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/keras/validation_functions.py +1 -1
  186. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/pytorch/quantize_wrapper.py +2 -2
  187. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/pytorch/quantizers/activation_inferable_quantizers/activation_lut_pot_inferable_quantizer.py +1 -2
  188. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/pytorch/quantizers/activation_inferable_quantizers/activation_pot_inferable_quantizer.py +1 -1
  189. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/pytorch/quantizers/activation_inferable_quantizers/activation_symmetric_inferable_quantizer.py +1 -1
  190. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/pytorch/quantizers/activation_inferable_quantizers/activation_uniform_inferable_quantizer.py +1 -1
  191. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/pytorch/quantizers/base_lut_symmetric_inferable_quantizer.py +1 -1
  192. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/pytorch/quantizers/base_pytorch_inferable_quantizer.py +1 -1
  193. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/pytorch/quantizers/base_symmetric_inferable_quantizer.py +1 -1
  194. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/pytorch/quantizers/base_uniform_inferable_quantizer.py +1 -1
  195. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/pytorch/quantizers/weights_inferable_quantizers/weights_lut_pot_inferable_quantizer.py +1 -1
  196. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/pytorch/quantizers/weights_inferable_quantizers/weights_lut_symmetric_inferable_quantizer.py +1 -1
  197. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/pytorch/quantizers/weights_inferable_quantizers/weights_pot_inferable_quantizer.py +1 -1
  198. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/pytorch/quantizers/weights_inferable_quantizers/weights_symmetric_inferable_quantizer.py +1 -1
  199. model_compression_toolkit/quantizers_infrastructure/inferable_infrastructure/pytorch/quantizers/weights_inferable_quantizers/weights_uniform_inferable_quantizer.py +2 -2
  200. model_compression_toolkit/quantizers_infrastructure/trainable_infrastructure/common/base_trainable_quantizer.py +9 -9
  201. model_compression_toolkit/quantizers_infrastructure/trainable_infrastructure/common/get_quantizer_config.py +2 -1
  202. model_compression_toolkit/quantizers_infrastructure/trainable_infrastructure/common/get_quantizers.py +3 -5
  203. model_compression_toolkit/quantizers_infrastructure/trainable_infrastructure/keras/base_keras_quantizer.py +2 -2
  204. model_compression_toolkit/quantizers_infrastructure/trainable_infrastructure/pytorch/base_pytorch_quantizer.py +2 -2
  205. model_compression_toolkit/target_platform_capabilities/constants.py +27 -0
  206. model_compression_toolkit/target_platform_capabilities/target_platform/current_tp_model.py +1 -1
  207. model_compression_toolkit/target_platform_capabilities/target_platform/operators.py +1 -1
  208. model_compression_toolkit/target_platform_capabilities/target_platform/quantization_format.py +20 -0
  209. model_compression_toolkit/target_platform_capabilities/target_platform/target_platform_model.py +11 -2
  210. model_compression_toolkit/target_platform_capabilities/target_platform/targetplatform2framework/attribute_filter.py +1 -1
  211. model_compression_toolkit/target_platform_capabilities/target_platform/targetplatform2framework/layer_filter_params.py +32 -34
  212. model_compression_toolkit/target_platform_capabilities/target_platform/targetplatform2framework/operations_to_layers.py +2 -2
  213. model_compression_toolkit/target_platform_capabilities/target_platform/targetplatform2framework/target_platform_capabilities.py +3 -24
  214. model_compression_toolkit/target_platform_capabilities/tpc_models/default_tpc/latest/__init__.py +1 -1
  215. model_compression_toolkit/target_platform_capabilities/tpc_models/default_tpc/target_platform_capabilities.py +3 -1
  216. model_compression_toolkit/target_platform_capabilities/tpc_models/default_tpc/v1/tp_model.py +7 -1
  217. model_compression_toolkit/target_platform_capabilities/tpc_models/default_tpc/v2/tp_model.py +7 -1
  218. model_compression_toolkit/target_platform_capabilities/tpc_models/default_tpc/v3/tp_model.py +7 -1
  219. model_compression_toolkit/target_platform_capabilities/tpc_models/default_tpc/v3_lut/tp_model.py +7 -2
  220. model_compression_toolkit/target_platform_capabilities/tpc_models/default_tpc/v4/tp_model.py +7 -1
  221. model_compression_toolkit/target_platform_capabilities/tpc_models/default_tpc/v4_lut/tp_model.py +7 -2
  222. model_compression_toolkit/target_platform_capabilities/tpc_models/default_tpc/v5/tp_model.py +7 -1
  223. model_compression_toolkit/target_platform_capabilities/tpc_models/get_target_platform_capabilities.py +1 -3
  224. model_compression_toolkit/target_platform_capabilities/tpc_models/imx500_tpc/latest/__init__.py +1 -1
  225. model_compression_toolkit/target_platform_capabilities/tpc_models/imx500_tpc/target_platform_capabilities.py +2 -1
  226. model_compression_toolkit/target_platform_capabilities/tpc_models/imx500_tpc/v1/tp_model.py +7 -1
  227. model_compression_toolkit/target_platform_capabilities/tpc_models/qnnpack_tpc/latest/__init__.py +1 -1
  228. model_compression_toolkit/target_platform_capabilities/tpc_models/qnnpack_tpc/target_platform_capabilities.py +2 -1
  229. model_compression_toolkit/target_platform_capabilities/tpc_models/qnnpack_tpc/v1/tp_model.py +7 -1
  230. model_compression_toolkit/target_platform_capabilities/tpc_models/tflite_tpc/latest/__init__.py +1 -1
  231. model_compression_toolkit/target_platform_capabilities/tpc_models/tflite_tpc/target_platform_capabilities.py +2 -1
  232. model_compression_toolkit/target_platform_capabilities/tpc_models/tflite_tpc/v1/tp_model.py +26 -18
  233. model_compression_toolkit/exporter/model_exporter/tflite/tflite_export_facade.py +0 -73
  234. {mct_nightly-1.8.0.22042023.post414.dist-info → mct_nightly-1.8.0.22052023.post408.dist-info}/LICENSE.md +0 -0
  235. {mct_nightly-1.8.0.22042023.post414.dist-info → mct_nightly-1.8.0.22052023.post408.dist-info}/WHEEL +0 -0
  236. {mct_nightly-1.8.0.22042023.post414.dist-info → mct_nightly-1.8.0.22052023.post408.dist-info}/top_level.txt +0 -0
  237. /model_compression_toolkit/{core/common/logger.py → logger.py} +0 -0
  238. /model_compression_toolkit/{core/common → target_platform_capabilities}/immutable.py +0 -0
@@ -15,8 +15,12 @@
15
15
  from typing import List, Tuple
16
16
 
17
17
  import model_compression_toolkit as mct
18
- from model_compression_toolkit.target_platform_capabilities.target_platform import OpQuantizationConfig, TargetPlatformModel
19
- from model_compression_toolkit.target_platform_capabilities.target_platform.op_quantization_config import QuantizationMethod
18
+ from model_compression_toolkit.target_platform_capabilities.target_platform import OpQuantizationConfig, \
19
+ TargetPlatformModel
20
+ from model_compression_toolkit.target_platform_capabilities.target_platform.op_quantization_config import \
21
+ QuantizationMethod
22
+ from model_compression_toolkit.target_platform_capabilities.target_platform.quantization_format import \
23
+ QuantizationFormat
20
24
 
21
25
  tp = mct.target_platform
22
26
 
@@ -65,7 +69,7 @@ def get_op_quantization_configs() -> Tuple[OpQuantizationConfig, List[OpQuantiza
65
69
  weights_multiplier_nbits=None
66
70
  )
67
71
 
68
- mixed_precision_cfg_list = [] # No mixed precision
72
+ mixed_precision_cfg_list = [] # No mixed precision
69
73
 
70
74
  return eight_bits, mixed_precision_cfg_list
71
75
 
@@ -106,28 +110,28 @@ def generate_tp_model(default_config: OpQuantizationConfig,
106
110
  # differently. For more details:
107
111
  # https://www.tensorflow.org/lite/performance/quantization_spec#int8_quantized_operator_specifications
108
112
  tp.OperatorsSet("NoQuantization",
109
- tp.get_default_quantization_config_options().clone_and_edit(
110
- quantization_preserving=True))
113
+ tp.get_default_quantization_config_options().clone_and_edit(
114
+ quantization_preserving=True))
111
115
 
112
116
  fc = tp.OperatorsSet("FullyConnected",
113
- tp.get_default_quantization_config_options().clone_and_edit(
114
- weights_per_channel_threshold=False))
117
+ tp.get_default_quantization_config_options().clone_and_edit(
118
+ weights_per_channel_threshold=False))
115
119
 
116
120
  tp.OperatorsSet("L2Normalization",
117
- tp.get_default_quantization_config_options().clone_and_edit(
118
- fixed_zero_point=0, fixed_scale=1 / 128))
121
+ tp.get_default_quantization_config_options().clone_and_edit(
122
+ fixed_zero_point=0, fixed_scale=1 / 128))
119
123
  tp.OperatorsSet("LogSoftmax",
120
- tp.get_default_quantization_config_options().clone_and_edit(
121
- fixed_zero_point=127, fixed_scale=16 / 256))
124
+ tp.get_default_quantization_config_options().clone_and_edit(
125
+ fixed_zero_point=127, fixed_scale=16 / 256))
122
126
  tp.OperatorsSet("Tanh",
123
- tp.get_default_quantization_config_options().clone_and_edit(
124
- fixed_zero_point=0, fixed_scale=1 / 128))
127
+ tp.get_default_quantization_config_options().clone_and_edit(
128
+ fixed_zero_point=0, fixed_scale=1 / 128))
125
129
  tp.OperatorsSet("Softmax",
126
- tp.get_default_quantization_config_options().clone_and_edit(
127
- fixed_zero_point=-128, fixed_scale=1 / 256))
130
+ tp.get_default_quantization_config_options().clone_and_edit(
131
+ fixed_zero_point=-128, fixed_scale=1 / 256))
128
132
  tp.OperatorsSet("Logistic",
129
- tp.get_default_quantization_config_options().clone_and_edit(
130
- fixed_zero_point=-128, fixed_scale=1 / 256))
133
+ tp.get_default_quantization_config_options().clone_and_edit(
134
+ fixed_zero_point=-128, fixed_scale=1 / 256))
131
135
 
132
136
  conv2d = tp.OperatorsSet("Conv2d")
133
137
  kernel = tp.OperatorSetConcat(conv2d, fc)
@@ -140,7 +144,8 @@ def generate_tp_model(default_config: OpQuantizationConfig,
140
144
  bias_add = tp.OperatorsSet("BiasAdd")
141
145
  add = tp.OperatorsSet("Add")
142
146
  squeeze = tp.OperatorsSet("Squeeze",
143
- qc_options=tp.get_default_quantization_config_options().clone_and_edit(quantization_preserving=True))
147
+ qc_options=tp.get_default_quantization_config_options().clone_and_edit(
148
+ quantization_preserving=True))
144
149
  # ------------------- #
145
150
  # Fusions
146
151
  # ------------------- #
@@ -152,4 +157,7 @@ def generate_tp_model(default_config: OpQuantizationConfig,
152
157
  tp.Fusing([batch_norm, activations_to_fuse])
153
158
  tp.Fusing([batch_norm, add, activations_to_fuse])
154
159
 
160
+ # Set quantization format to int8
161
+ generated_tpc.set_quantization_format(QuantizationFormat.INT8)
162
+
155
163
  return generated_tpc
@@ -1,73 +0,0 @@
1
- # Copyright 2022 Sony Semiconductor Israel, Inc. All rights reserved.
2
- #
3
- # Licensed under the Apache License, Version 2.0 (the "License");
4
- # you may not use this file except in compliance with the License.
5
- # You may obtain a copy of the License at
6
- #
7
- # http://www.apache.org/licenses/LICENSE-2.0
8
- #
9
- # Unless required by applicable law or agreed to in writing, software
10
- # distributed under the License is distributed on an "AS IS" BASIS,
11
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
- # See the License for the specific language governing permissions and
13
- # limitations under the License.
14
- # ==============================================================================
15
- from enum import Enum
16
- from typing import Callable
17
-
18
- from model_compression_toolkit.core.common import Logger
19
- from model_compression_toolkit.core.common.constants import FOUND_TF
20
-
21
-
22
- class TFLiteExportMode(Enum):
23
- FAKELY_QUANT = 0
24
- INT8 = 1
25
-
26
- if FOUND_TF:
27
- import keras
28
- from model_compression_toolkit.exporter.model_exporter.tflite.fakely_quant_tflite_exporter import FakelyQuantTFLiteExporter
29
- from model_compression_toolkit.exporter.model_exporter.tflite.int8_tflite_exporter import INT8TFLiteExporter
30
- from model_compression_toolkit.exporter.model_wrapper.keras.validate_layer import is_keras_layer_exportable
31
-
32
- def tflite_export_model(model: keras.models.Model,
33
- save_model_path: str,
34
- mode: TFLiteExportMode = TFLiteExportMode.FAKELY_QUANT,
35
- is_layer_exportable_fn: Callable = is_keras_layer_exportable
36
- ):
37
- """
38
- Export a Keras quantized model to a tflite model.
39
- The model will be saved to the path in save_model_path.
40
- Mode can be used for different exported files. Currently, tflite_export_model
41
- supports TFLiteExportMode.FAKELY_QUANT (where weights and activations are
42
- float fakely-quantized values), and TFLiteExportMode.INT8 (where weights
43
- and activations are represented using 8bits integers).
44
-
45
- Args:
46
- model: Model to export.
47
- is_layer_exportable_fn: Callable to check whether a layer can be exported or not.
48
- mode: Mode to export the model according to.
49
- save_model_path: Path to save the model.
50
-
51
- """
52
-
53
- if mode == TFLiteExportMode.FAKELY_QUANT:
54
- exporter = FakelyQuantTFLiteExporter(model,
55
- is_layer_exportable_fn,
56
- save_model_path)
57
- elif mode == TFLiteExportMode.INT8:
58
- exporter = INT8TFLiteExporter(model,
59
- is_layer_exportable_fn,
60
- save_model_path)
61
-
62
- else:
63
- Logger.critical(
64
- f'Unsupported mode was used {mode.name} to export TFLite model.'
65
- f' Please see API for supported modes.') # pragma: no cover
66
-
67
- exporter.export()
68
-
69
- else:
70
- def tflite_export_model(*args, **kwargs):
71
- Logger.error('Installing tensorflow and tensorflow_model_optimization is mandatory '
72
- 'when using tflite_export_model. '
73
- 'Could not find some or all of TensorFlow packages.') # pragma: no cover