neural-compressor 2.2__tar.gz → 2.3__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (965)
  1. neural_compressor-2.3/PKG-INFO +191 -0
  2. neural_compressor-2.3/README.md +160 -0
  3. neural_compressor-2.3/neural_coder/__init__.py +20 -0
  4. neural_compressor-2.3/neural_coder/backends/nano_bf16.yaml +27 -0
  5. neural_compressor-2.3/neural_coder/backends/nano_bf16_channels_last.yaml +27 -0
  6. neural_compressor-2.3/neural_coder/backends/nano_bf16_ipex.yaml +27 -0
  7. neural_compressor-2.3/neural_coder/backends/nano_bf16_ipex_channels_last.yaml +27 -0
  8. neural_compressor-2.3/neural_coder/backends/nano_fp32_channels_last.yaml +27 -0
  9. neural_compressor-2.3/neural_coder/backends/nano_fp32_ipex.yaml +27 -0
  10. neural_compressor-2.3/neural_coder/backends/nano_fp32_ipex_channels_last.yaml +27 -0
  11. neural_compressor-2.3/neural_coder/backends/nano_gpu_to_cpu.yaml +24 -0
  12. neural_compressor-2.3/neural_coder/backends/nano_int8.yaml +27 -0
  13. neural_compressor-2.3/neural_coder/backends/nano_jit_bf16.yaml +27 -0
  14. neural_compressor-2.3/neural_coder/backends/nano_jit_bf16_channels_last.yaml +27 -0
  15. neural_compressor-2.3/neural_coder/backends/nano_jit_bf16_ipex.yaml +27 -0
  16. neural_compressor-2.3/neural_coder/backends/nano_jit_bf16_ipex_channels_last.yaml +27 -0
  17. neural_compressor-2.3/neural_coder/backends/nano_jit_fp32_channels_last.yaml +27 -0
  18. neural_compressor-2.3/neural_coder/backends/nano_jit_fp32_ipex_channels_last.yaml +27 -0
  19. neural_compressor-2.3/neural_coder/backends/nano_onnxruntime_fp32.yaml +27 -0
  20. neural_compressor-2.3/neural_coder/backends/nano_onnxruntime_int8_qlinear.yaml +27 -0
  21. neural_compressor-2.3/neural_coder/backends/nano_openvino_fp32.yaml +27 -0
  22. neural_compressor-2.3/neural_coder/backends/nano_openvino_int8.yaml +27 -0
  23. neural_compressor-2.3/neural_coder/backends/pytorch_aliblade.yaml +25 -0
  24. neural_compressor-2.3/neural_coder/backends/pytorch_inc_static_quant_fx.yaml +46 -0
  25. neural_compressor-2.3/neural_coder/backends/pytorch_inc_static_quant_fx_fp8.yaml +46 -0
  26. neural_compressor-2.3/neural_coder/backends/pytorch_jit_script.yaml +36 -0
  27. neural_compressor-2.3/neural_coder/backends/pytorch_jit_script_ofi.yaml +35 -0
  28. neural_compressor-2.3/neural_coder/backends/pytorch_mixed_precision_cpu.yaml +28 -0
  29. neural_compressor-2.3/neural_coder/coders/autoinc/autoinc_harness.py +476 -0
  30. neural_compressor-2.3/neural_coder/coders/autoinc/calib_dataloader.py +45 -0
  31. neural_compressor-2.3/neural_coder/coders/autoinc/domain.py +34 -0
  32. neural_compressor-2.3/neural_coder/coders/autoinc/eval_func.py +111 -0
  33. neural_compressor-2.3/neural_coder/coders/pytorch/batch_size.py +83 -0
  34. neural_compressor-2.3/neural_coder/coders/pytorch/change_trainer_to_nlptrainer.py +47 -0
  35. neural_compressor-2.3/neural_coder/coders/pytorch/cuda_to_cpu.py +86 -0
  36. neural_compressor-2.3/neural_coder/coders/pytorch/dummy_dataloader.py +124 -0
  37. neural_compressor-2.3/neural_coder/coders/pytorch/harness.py +421 -0
  38. neural_compressor-2.3/neural_coder/coders/pytorch/lightning.py +86 -0
  39. neural_compressor-2.3/neural_coder/coders/pytorch/reclaim_inference_transformers_trainer.py +75 -0
  40. neural_compressor-2.3/neural_coder/coders/pytorch/reclaim_inputs.py +106 -0
  41. neural_compressor-2.3/neural_coder/coders/tensorflow/amp.py +64 -0
  42. neural_compressor-2.3/neural_coder/coders/tensorflow/inc.py +50 -0
  43. neural_compressor-2.3/neural_coder/coders/transform.py +84 -0
  44. neural_compressor-2.3/neural_coder/globals.py +117 -0
  45. neural_compressor-2.3/neural_coder/graphers/code_line.py +278 -0
  46. neural_compressor-2.3/neural_coder/graphers/function.py +189 -0
  47. neural_compressor-2.3/neural_coder/graphers/model.py +290 -0
  48. neural_compressor-2.3/neural_coder/graphers/preloads/transformers.yaml +2160 -0
  49. neural_compressor-2.3/neural_coder/interface.py +1333 -0
  50. neural_compressor-2.3/neural_coder/launcher.py +103 -0
  51. neural_compressor-2.3/neural_coder/utils/common.py +27 -0
  52. neural_compressor-2.3/neural_coder/utils/cpu_info.py +44 -0
  53. neural_compressor-2.3/neural_coder/utils/device.py +89 -0
  54. neural_compressor-2.3/neural_coder/utils/handle_user_input.py +237 -0
  55. neural_compressor-2.3/neural_coder/utils/line_operation.py +148 -0
  56. neural_compressor-2.3/neural_coder/utils/numa_launcher.py +913 -0
  57. neural_compressor-2.3/neural_coder/utils/pdf_report.py +424 -0
  58. neural_compressor-2.3/neural_compressor/__init__.py +32 -0
  59. neural_compressor-2.3/neural_compressor/adaptor/__init__.py +28 -0
  60. neural_compressor-2.3/neural_compressor/adaptor/adaptor.py +199 -0
  61. neural_compressor-2.3/neural_compressor/adaptor/keras.py +1024 -0
  62. neural_compressor-2.3/neural_compressor/adaptor/keras.yaml +121 -0
  63. neural_compressor-2.3/neural_compressor/adaptor/keras_utils/__init__.py +16 -0
  64. neural_compressor-2.3/neural_compressor/adaptor/keras_utils/conv2d.py +109 -0
  65. neural_compressor-2.3/neural_compressor/adaptor/keras_utils/dense.py +82 -0
  66. neural_compressor-2.3/neural_compressor/adaptor/keras_utils/depthwise_conv2d.py +139 -0
  67. neural_compressor-2.3/neural_compressor/adaptor/keras_utils/pool2d.py +59 -0
  68. neural_compressor-2.3/neural_compressor/adaptor/keras_utils/quantizer.py +137 -0
  69. neural_compressor-2.3/neural_compressor/adaptor/keras_utils/separable_conv2d.py +124 -0
  70. neural_compressor-2.3/neural_compressor/adaptor/mxnet.py +512 -0
  71. neural_compressor-2.3/neural_compressor/adaptor/mxnet.yaml +355 -0
  72. neural_compressor-2.3/neural_compressor/adaptor/mxnet_utils/__init__.py +17 -0
  73. neural_compressor-2.3/neural_compressor/adaptor/mxnet_utils/util.py +924 -0
  74. neural_compressor-2.3/neural_compressor/adaptor/onnxrt.py +2025 -0
  75. neural_compressor-2.3/neural_compressor/adaptor/onnxrt.yaml +446 -0
  76. neural_compressor-2.3/neural_compressor/adaptor/onnxrt_cuda.yaml +443 -0
  77. neural_compressor-2.3/neural_compressor/adaptor/onnxrt_dml.yaml +67 -0
  78. neural_compressor-2.3/neural_compressor/adaptor/onnxrt_dnnl.yaml +417 -0
  79. neural_compressor-2.3/neural_compressor/adaptor/onnxrt_trt.yaml +141 -0
  80. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/calibration.py +759 -0
  81. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/calibrator.py +405 -0
  82. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/operators/__init__.py +29 -0
  83. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/operators/activation.py +150 -0
  84. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/operators/argmax.py +51 -0
  85. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/operators/attention.py +130 -0
  86. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/operators/binary_op.py +195 -0
  87. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/operators/concat.py +179 -0
  88. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/operators/conv.py +245 -0
  89. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/operators/direct_q8.py +93 -0
  90. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/operators/embed_layernorm.py +121 -0
  91. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/operators/gather.py +125 -0
  92. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/operators/gavgpool.py +95 -0
  93. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/operators/gemm.py +165 -0
  94. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/operators/lstm.py +137 -0
  95. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/operators/matmul.py +205 -0
  96. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/operators/maxpool.py +86 -0
  97. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/operators/norm.py +48 -0
  98. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/operators/ops.py +154 -0
  99. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/operators/pad.py +112 -0
  100. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/operators/pooling.py +120 -0
  101. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/operators/reduce.py +85 -0
  102. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/operators/resize.py +87 -0
  103. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/operators/split.py +156 -0
  104. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/operators/unary_op.py +83 -0
  105. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/quantizer.py +1301 -0
  106. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/smooth_quant.py +709 -0
  107. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/util.py +586 -0
  108. neural_compressor-2.3/neural_compressor/adaptor/ox_utils/weight_only.py +1054 -0
  109. neural_compressor-2.3/neural_compressor/adaptor/pytorch.py +4926 -0
  110. neural_compressor-2.3/neural_compressor/adaptor/pytorch_cpu.yaml +447 -0
  111. neural_compressor-2.3/neural_compressor/adaptor/pytorch_gpu.yaml +81 -0
  112. neural_compressor-2.3/neural_compressor/adaptor/pytorch_ipex.yaml +151 -0
  113. neural_compressor-2.3/neural_compressor/adaptor/query.py +76 -0
  114. neural_compressor-2.3/neural_compressor/adaptor/tensorflow.py +2549 -0
  115. neural_compressor-2.3/neural_compressor/adaptor/tensorflow.yaml +245 -0
  116. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_converter.py +922 -0
  117. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_converter_without_calib.py +365 -0
  118. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/bf16/bf16_convert.py +289 -0
  119. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/convert_add_to_biasadd.py +77 -0
  120. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/convert_layout.py +87 -0
  121. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/convert_leakyrelu.py +78 -0
  122. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/convert_nan_to_random.py +52 -0
  123. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/convert_placeholder_to_const.py +99 -0
  124. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/dequantize_cast_optimizer.py +83 -0
  125. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/dilated_contraction.py +89 -0
  126. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/dummy_biasadd.py +130 -0
  127. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/expanddims_optimizer.py +81 -0
  128. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fetch_weight_from_reshape.py +89 -0
  129. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fold_batch_norm.py +271 -0
  130. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fold_constant.py +182 -0
  131. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_biasadd_add.py +75 -0
  132. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_column_wise_mul.py +86 -0
  133. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_conv_with_math.py +111 -0
  134. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_decomposed_bn.py +400 -0
  135. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_decomposed_in.py +369 -0
  136. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_gelu.py +229 -0
  137. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_layer_norm.py +244 -0
  138. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_pad_with_conv.py +126 -0
  139. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_pad_with_fp32_conv.py +129 -0
  140. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_reshape_transpose.py +126 -0
  141. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/graph_cse_optimizer.py +145 -0
  142. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/grappler_pass.py +71 -0
  143. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/insert_print_node.py +224 -0
  144. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/move_squeeze_after_relu.py +123 -0
  145. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/pre_optimize.py +306 -0
  146. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/remove_training_nodes.py +66 -0
  147. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/rename_batch_norm.py +60 -0
  148. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/split_shared_input.py +60 -0
  149. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/strip_equivalent_nodes.py +50 -0
  150. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/strip_unused_nodes.py +39 -0
  151. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/switch_optimizer.py +85 -0
  152. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/graph_base.py +40 -0
  153. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/freeze_fake_quant.py +149 -0
  154. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/freeze_value.py +396 -0
  155. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/freeze_value_without_calib.py +123 -0
  156. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/fuse_conv_redundant_dequantize.py +150 -0
  157. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/fuse_conv_requantize.py +805 -0
  158. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/fuse_matmul_redundant_dequantize.py +158 -0
  159. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/fuse_matmul_requantize.py +904 -0
  160. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/meta_op_optimizer.py +116 -0
  161. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/post_hostconst_converter.py +53 -0
  162. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/post_quantized_op_cse.py +135 -0
  163. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/rnn_convert.py +296 -0
  164. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/scale_propagation.py +118 -0
  165. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/onnx/onnx_graph.py +1389 -0
  166. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/onnx/onnx_node.py +414 -0
  167. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/onnx/onnx_schema.py +131 -0
  168. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/onnx/tf2onnx_utils.py +655 -0
  169. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/qdq/insert_qdq_pattern.py +730 -0
  170. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/qdq/merge_duplicated_qdq.py +94 -0
  171. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_rewriter/qdq/share_qdq_y_pattern.py +60 -0
  172. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/graph_util.py +1090 -0
  173. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/quantize_graph/qat/fake_quantize.py +231 -0
  174. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/quantize_graph/qat/quantize_config.py +129 -0
  175. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/quantize_graph/qat/quantize_helper.py +92 -0
  176. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/quantize_graph/qat/quantize_layers/optimize_layer.py +32 -0
  177. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/quantize_graph/qat/quantize_layers/quantize_layer_add.py +83 -0
  178. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/quantize_graph/qat/quantize_layers/quantize_layer_base.py +87 -0
  179. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/quantize_graph/qat/quantize_layers/quantize_layer_bn.py +58 -0
  180. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/quantize_graph/qat/quantize_wrapper.py +284 -0
  181. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/quantize_graph/qdq/fuse_qdq_bn.py +303 -0
  182. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/quantize_graph/qdq/fuse_qdq_concatv2.py +261 -0
  183. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/quantize_graph/qdq/fuse_qdq_conv.py +2022 -0
  184. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/quantize_graph/qdq/fuse_qdq_deconv.py +541 -0
  185. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/quantize_graph/qdq/fuse_qdq_in.py +183 -0
  186. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/quantize_graph/qdq/fuse_qdq_matmul.py +1039 -0
  187. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/quantize_graph/qdq/fuse_qdq_pooling.py +137 -0
  188. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/quantize_graph/qdq/optimize_qdq.py +158 -0
  189. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/quantize_graph/quantize_graph_base.py +757 -0
  190. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/quantize_graph/quantize_graph_bn.py +298 -0
  191. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/quantize_graph/quantize_graph_concatv2.py +106 -0
  192. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/quantize_graph/quantize_graph_conv.py +378 -0
  193. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/quantize_graph/quantize_graph_for_intel_cpu.py +130 -0
  194. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/quantize_graph/quantize_graph_matmul.py +351 -0
  195. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/quantize_graph/quantize_graph_pooling.py +73 -0
  196. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/quantize_graph_common.py +448 -0
  197. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/smooth_quant_calibration.py +225 -0
  198. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/smooth_quant_scaler.py +155 -0
  199. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/tf2onnx_converter.py +336 -0
  200. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/transform_graph/bias_correction.py +137 -0
  201. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/transform_graph/graph_transform_base.py +111 -0
  202. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/transform_graph/insert_logging.py +199 -0
  203. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/transform_graph/rerange_quantized_concat.py +313 -0
  204. neural_compressor-2.3/neural_compressor/adaptor/tf_utils/util.py +661 -0
  205. neural_compressor-2.3/neural_compressor/adaptor/torch_utils/awq.py +480 -0
  206. neural_compressor-2.3/neural_compressor/adaptor/torch_utils/bf16_convert.py +93 -0
  207. neural_compressor-2.3/neural_compressor/adaptor/torch_utils/gptq.py +844 -0
  208. neural_compressor-2.3/neural_compressor/adaptor/torch_utils/hawq_metric.py +620 -0
  209. neural_compressor-2.3/neural_compressor/adaptor/torch_utils/layer_wise_quant/__init__.py +19 -0
  210. neural_compressor-2.3/neural_compressor/adaptor/torch_utils/layer_wise_quant/modified_pickle.py +1861 -0
  211. neural_compressor-2.3/neural_compressor/adaptor/torch_utils/layer_wise_quant/quantize.py +280 -0
  212. neural_compressor-2.3/neural_compressor/adaptor/torch_utils/layer_wise_quant/torch_load.py +286 -0
  213. neural_compressor-2.3/neural_compressor/adaptor/torch_utils/layer_wise_quant/utils.py +256 -0
  214. neural_compressor-2.3/neural_compressor/adaptor/torch_utils/mixed_precision.py +45 -0
  215. neural_compressor-2.3/neural_compressor/adaptor/torch_utils/model_wrapper.py +557 -0
  216. neural_compressor-2.3/neural_compressor/adaptor/torch_utils/pattern_detector.py +166 -0
  217. neural_compressor-2.3/neural_compressor/adaptor/torch_utils/smooth_quant.py +1390 -0
  218. neural_compressor-2.3/neural_compressor/adaptor/torch_utils/symbolic_trace.py +77 -0
  219. neural_compressor-2.3/neural_compressor/adaptor/torch_utils/teq.py +309 -0
  220. neural_compressor-2.3/neural_compressor/adaptor/torch_utils/util.py +1273 -0
  221. neural_compressor-2.3/neural_compressor/adaptor/torch_utils/weight_only.py +640 -0
  222. neural_compressor-2.3/neural_compressor/algorithm/__init__.py +30 -0
  223. neural_compressor-2.3/neural_compressor/algorithm/algorithm.py +231 -0
  224. neural_compressor-2.3/neural_compressor/algorithm/fast_bias_correction.py +160 -0
  225. neural_compressor-2.3/neural_compressor/algorithm/smooth_quant.py +90 -0
  226. neural_compressor-2.3/neural_compressor/algorithm/weight_correction.py +148 -0
  227. neural_compressor-2.3/neural_compressor/benchmark.py +543 -0
  228. neural_compressor-2.3/neural_compressor/compression/__init__.py +18 -0
  229. neural_compressor-2.3/neural_compressor/compression/callbacks.py +479 -0
  230. neural_compressor-2.3/neural_compressor/compression/distillation/__init__.py +17 -0
  231. neural_compressor-2.3/neural_compressor/compression/distillation/criterions.py +1509 -0
  232. neural_compressor-2.3/neural_compressor/compression/hpo/__init__.py +21 -0
  233. neural_compressor-2.3/neural_compressor/compression/hpo/sa_optimizer.py +127 -0
  234. neural_compressor-2.3/neural_compressor/compression/hpo/search_algorithms.py +365 -0
  235. neural_compressor-2.3/neural_compressor/compression/hpo/search_space.py +169 -0
  236. neural_compressor-2.3/neural_compressor/compression/pruner/__init__.py +234 -0
  237. neural_compressor-2.3/neural_compressor/compression/pruner/criteria.py +305 -0
  238. neural_compressor-2.3/neural_compressor/compression/pruner/model_slim/__init__.py +19 -0
  239. neural_compressor-2.3/neural_compressor/compression/pruner/model_slim/auto_slim.py +130 -0
  240. neural_compressor-2.3/neural_compressor/compression/pruner/model_slim/pattern_analyzer.py +842 -0
  241. neural_compressor-2.3/neural_compressor/compression/pruner/model_slim/weight_slim.py +394 -0
  242. neural_compressor-2.3/neural_compressor/compression/pruner/patterns/__init__.py +63 -0
  243. neural_compressor-2.3/neural_compressor/compression/pruner/patterns/base.py +718 -0
  244. neural_compressor-2.3/neural_compressor/compression/pruner/patterns/mha.py +58 -0
  245. neural_compressor-2.3/neural_compressor/compression/pruner/patterns/ninm.py +455 -0
  246. neural_compressor-2.3/neural_compressor/compression/pruner/patterns/nxm.py +840 -0
  247. neural_compressor-2.3/neural_compressor/compression/pruner/pruners/__init__.py +90 -0
  248. neural_compressor-2.3/neural_compressor/compression/pruner/pruners/base.py +263 -0
  249. neural_compressor-2.3/neural_compressor/compression/pruner/pruners/basic.py +211 -0
  250. neural_compressor-2.3/neural_compressor/compression/pruner/pruners/block_mask.py +167 -0
  251. neural_compressor-2.3/neural_compressor/compression/pruner/pruners/mha.py +250 -0
  252. neural_compressor-2.3/neural_compressor/compression/pruner/pruners/pattern_lock.py +57 -0
  253. neural_compressor-2.3/neural_compressor/compression/pruner/pruners/progressive.py +272 -0
  254. neural_compressor-2.3/neural_compressor/compression/pruner/pruners/retrain_free.py +197 -0
  255. neural_compressor-2.3/neural_compressor/compression/pruner/pruners/sparse_gpt.py +114 -0
  256. neural_compressor-2.3/neural_compressor/compression/pruner/pruning.py +286 -0
  257. neural_compressor-2.3/neural_compressor/compression/pruner/regs.py +144 -0
  258. neural_compressor-2.3/neural_compressor/compression/pruner/schedulers.py +182 -0
  259. neural_compressor-2.3/neural_compressor/compression/pruner/tf_criteria.py +96 -0
  260. neural_compressor-2.3/neural_compressor/compression/pruner/utils.py +735 -0
  261. neural_compressor-2.3/neural_compressor/conf/__init__.py +16 -0
  262. neural_compressor-2.3/neural_compressor/conf/config.py +1733 -0
  263. neural_compressor-2.3/neural_compressor/conf/dotdict.py +88 -0
  264. neural_compressor-2.3/neural_compressor/conf/pythonic_config.py +1460 -0
  265. neural_compressor-2.3/neural_compressor/config.py +2587 -0
  266. neural_compressor-2.3/neural_compressor/contrib/__init__.py +18 -0
  267. neural_compressor-2.3/neural_compressor/contrib/strategy/__init__.py +25 -0
  268. neural_compressor-2.3/neural_compressor/contrib/strategy/sigopt.py +312 -0
  269. neural_compressor-2.3/neural_compressor/contrib/strategy/tpe.py +547 -0
  270. neural_compressor-2.3/neural_compressor/data/__init__.py +66 -0
  271. neural_compressor-2.3/neural_compressor/data/dataloaders/__init__.py +21 -0
  272. neural_compressor-2.3/neural_compressor/data/dataloaders/base_dataloader.py +141 -0
  273. neural_compressor-2.3/neural_compressor/data/dataloaders/dataloader.py +150 -0
  274. neural_compressor-2.3/neural_compressor/data/dataloaders/default_dataloader.py +170 -0
  275. neural_compressor-2.3/neural_compressor/data/dataloaders/fetcher.py +130 -0
  276. neural_compressor-2.3/neural_compressor/data/dataloaders/mxnet_dataloader.py +57 -0
  277. neural_compressor-2.3/neural_compressor/data/dataloaders/onnxrt_dataloader.py +118 -0
  278. neural_compressor-2.3/neural_compressor/data/dataloaders/pytorch_dataloader.py +82 -0
  279. neural_compressor-2.3/neural_compressor/data/dataloaders/sampler.py +142 -0
  280. neural_compressor-2.3/neural_compressor/data/dataloaders/tensorflow_dataloader.py +404 -0
  281. neural_compressor-2.3/neural_compressor/data/datasets/__init__.py +31 -0
  282. neural_compressor-2.3/neural_compressor/data/datasets/bert_dataset.py +493 -0
  283. neural_compressor-2.3/neural_compressor/data/datasets/coco_dataset.py +339 -0
  284. neural_compressor-2.3/neural_compressor/data/datasets/dataset.py +1151 -0
  285. neural_compressor-2.3/neural_compressor/data/datasets/dummy_dataset.py +160 -0
  286. neural_compressor-2.3/neural_compressor/data/datasets/dummy_dataset_v2.py +308 -0
  287. neural_compressor-2.3/neural_compressor/data/datasets/imagenet_dataset.py +241 -0
  288. neural_compressor-2.3/neural_compressor/data/datasets/style_transfer_dataset.py +95 -0
  289. neural_compressor-2.3/neural_compressor/data/filters/__init__.py +31 -0
  290. neural_compressor-2.3/neural_compressor/data/filters/coco_filter.py +63 -0
  291. neural_compressor-2.3/neural_compressor/data/filters/filter.py +189 -0
  292. neural_compressor-2.3/neural_compressor/data/transforms/__init__.py +62 -0
  293. neural_compressor-2.3/neural_compressor/data/transforms/coco_transform.py +48 -0
  294. neural_compressor-2.3/neural_compressor/data/transforms/imagenet_transform.py +493 -0
  295. neural_compressor-2.3/neural_compressor/data/transforms/postprocess.py +28 -0
  296. neural_compressor-2.3/neural_compressor/data/transforms/tokenization.py +352 -0
  297. neural_compressor-2.3/neural_compressor/data/transforms/transform.py +2859 -0
  298. neural_compressor-2.3/neural_compressor/experimental/__init__.py +43 -0
  299. neural_compressor-2.3/neural_compressor/experimental/benchmark.py +648 -0
  300. neural_compressor-2.3/neural_compressor/experimental/common/__init__.py +26 -0
  301. neural_compressor-2.3/neural_compressor/experimental/common/criterion.py +1622 -0
  302. neural_compressor-2.3/neural_compressor/experimental/common/dataloader.py +118 -0
  303. neural_compressor-2.3/neural_compressor/experimental/common/metric.py +38 -0
  304. neural_compressor-2.3/neural_compressor/experimental/common/model.py +69 -0
  305. neural_compressor-2.3/neural_compressor/experimental/common/optimizer.py +230 -0
  306. neural_compressor-2.3/neural_compressor/experimental/common/postprocess.py +28 -0
  307. neural_compressor-2.3/neural_compressor/experimental/common/torch_utils.py +65 -0
  308. neural_compressor-2.3/neural_compressor/experimental/component.py +546 -0
  309. neural_compressor-2.3/neural_compressor/experimental/compression/__init__.py +17 -0
  310. neural_compressor-2.3/neural_compressor/experimental/contrib/__init__.py +18 -0
  311. neural_compressor-2.3/neural_compressor/experimental/contrib/strategy/__init__.py +24 -0
  312. neural_compressor-2.3/neural_compressor/experimental/contrib/strategy/sigopt.py +275 -0
  313. neural_compressor-2.3/neural_compressor/experimental/contrib/strategy/tpe.py +527 -0
  314. neural_compressor-2.3/neural_compressor/experimental/data/__init__.py +38 -0
  315. neural_compressor-2.3/neural_compressor/experimental/data/dataloaders/base_dataloader.py +141 -0
  316. neural_compressor-2.3/neural_compressor/experimental/data/dataloaders/dataloader.py +38 -0
  317. neural_compressor-2.3/neural_compressor/experimental/data/dataloaders/default_dataloader.py +170 -0
  318. neural_compressor-2.3/neural_compressor/experimental/data/dataloaders/fetcher.py +130 -0
  319. neural_compressor-2.3/neural_compressor/experimental/data/dataloaders/mxnet_dataloader.py +57 -0
  320. neural_compressor-2.3/neural_compressor/experimental/data/dataloaders/onnxrt_dataloader.py +118 -0
  321. neural_compressor-2.3/neural_compressor/experimental/data/dataloaders/pytorch_dataloader.py +82 -0
  322. neural_compressor-2.3/neural_compressor/experimental/data/dataloaders/sampler.py +142 -0
  323. neural_compressor-2.3/neural_compressor/experimental/data/dataloaders/tensorflow_dataloader.py +404 -0
  324. neural_compressor-2.3/neural_compressor/experimental/data/datasets/__init__.py +30 -0
  325. neural_compressor-2.3/neural_compressor/experimental/data/datasets/bert_dataset.py +491 -0
  326. neural_compressor-2.3/neural_compressor/experimental/data/datasets/coco_dataset.py +339 -0
  327. neural_compressor-2.3/neural_compressor/experimental/data/datasets/dataset.py +1151 -0
  328. neural_compressor-2.3/neural_compressor/experimental/data/datasets/dummy_dataset.py +160 -0
  329. neural_compressor-2.3/neural_compressor/experimental/data/datasets/dummy_dataset_v2.py +308 -0
  330. neural_compressor-2.3/neural_compressor/experimental/data/datasets/imagenet_dataset.py +241 -0
  331. neural_compressor-2.3/neural_compressor/experimental/data/datasets/style_transfer_dataset.py +95 -0
  332. neural_compressor-2.3/neural_compressor/experimental/data/filters/__init__.py +30 -0
  333. neural_compressor-2.3/neural_compressor/experimental/data/filters/coco_filter.py +63 -0
  334. neural_compressor-2.3/neural_compressor/experimental/data/filters/filter.py +189 -0
  335. neural_compressor-2.3/neural_compressor/experimental/data/transforms/__init__.py +31 -0
  336. neural_compressor-2.3/neural_compressor/experimental/data/transforms/imagenet_transform.py +464 -0
  337. neural_compressor-2.3/neural_compressor/experimental/data/transforms/tokenization.py +352 -0
  338. neural_compressor-2.3/neural_compressor/experimental/data/transforms/transform.py +2865 -0
  339. neural_compressor-2.3/neural_compressor/experimental/distillation.py +509 -0
  340. neural_compressor-2.3/neural_compressor/experimental/export/__init__.py +21 -0
  341. neural_compressor-2.3/neural_compressor/experimental/export/qlinear2qdq.py +83 -0
  342. neural_compressor-2.3/neural_compressor/experimental/export/tf2onnx.py +118 -0
  343. neural_compressor-2.3/neural_compressor/experimental/export/torch2onnx.py +426 -0
  344. neural_compressor-2.3/neural_compressor/experimental/graph_optimization.py +445 -0
  345. neural_compressor-2.3/neural_compressor/experimental/metric/__init__.py +30 -0
  346. neural_compressor-2.3/neural_compressor/experimental/metric/bleu.py +143 -0
  347. neural_compressor-2.3/neural_compressor/experimental/metric/bleu_util.py +137 -0
  348. neural_compressor-2.3/neural_compressor/experimental/metric/coco_label_map.py +102 -0
  349. neural_compressor-2.3/neural_compressor/experimental/metric/coco_tools.py +694 -0
  350. neural_compressor-2.3/neural_compressor/experimental/metric/evaluate_squad.py +117 -0
  351. neural_compressor-2.3/neural_compressor/experimental/metric/f1.py +149 -0
  352. neural_compressor-2.3/neural_compressor/experimental/metric/metric.py +1601 -0
  353. neural_compressor-2.3/neural_compressor/experimental/mixed_precision.py +230 -0
  354. neural_compressor-2.3/neural_compressor/experimental/model_conversion.py +365 -0
  355. neural_compressor-2.3/neural_compressor/experimental/nas/basic_nas.py +140 -0
  356. neural_compressor-2.3/neural_compressor/experimental/nas/dynas.py +110 -0
  357. neural_compressor-2.3/neural_compressor/experimental/nas/nas.py +350 -0
  358. neural_compressor-2.3/neural_compressor/experimental/nas/nas_utils.py +86 -0
  359. neural_compressor-2.3/neural_compressor/experimental/nas/search_algorithms.py +168 -0
  360. neural_compressor-2.3/neural_compressor/experimental/pruner_legacy/__init__.py +29 -0
  361. neural_compressor-2.3/neural_compressor/experimental/pruner_legacy/gradient_sensitivity.py +231 -0
  362. neural_compressor-2.3/neural_compressor/experimental/pruner_legacy/group_lasso.py +69 -0
  363. neural_compressor-2.3/neural_compressor/experimental/pruner_legacy/magnitude.py +105 -0
  364. neural_compressor-2.3/neural_compressor/experimental/pruner_legacy/pattern_lock.py +64 -0
  365. neural_compressor-2.3/neural_compressor/experimental/pruner_legacy/pruner.py +137 -0
  366. neural_compressor-2.3/neural_compressor/experimental/pruning.py +501 -0
  367. neural_compressor-2.3/neural_compressor/experimental/pruning_recipes/__init__.py +25 -0
  368. neural_compressor-2.3/neural_compressor/experimental/pruning_recipes/patterns/__init__.py +30 -0
  369. neural_compressor-2.3/neural_compressor/experimental/pruning_recipes/patterns/pattern.py +110 -0
  370. neural_compressor-2.3/neural_compressor/experimental/pruning_recipes/patterns/tile_pattern.py +87 -0
  371. neural_compressor-2.3/neural_compressor/experimental/pruning_v2.py +524 -0
  372. neural_compressor-2.3/neural_compressor/experimental/pytorch_pruner/logger.py +19 -0
  373. neural_compressor-2.3/neural_compressor/experimental/pytorch_pruner/patterns.py +581 -0
  374. neural_compressor-2.3/neural_compressor/experimental/pytorch_pruner/prune_utils.py +223 -0
  375. neural_compressor-2.3/neural_compressor/experimental/pytorch_pruner/pruner.py +347 -0
  376. neural_compressor-2.3/neural_compressor/experimental/pytorch_pruner/pruning.py +166 -0
  377. neural_compressor-2.3/neural_compressor/experimental/pytorch_pruner/scheduler.py +164 -0
  378. neural_compressor-2.3/neural_compressor/experimental/quantization.py +484 -0
  379. neural_compressor-2.3/neural_compressor/experimental/scheduler.py +391 -0
  380. neural_compressor-2.3/neural_compressor/experimental/strategy/__init__.py +29 -0
  381. neural_compressor-2.3/neural_compressor/experimental/strategy/auto_mixed_precision.py +167 -0
  382. neural_compressor-2.3/neural_compressor/experimental/strategy/basic.py +185 -0
  383. neural_compressor-2.3/neural_compressor/experimental/strategy/bayesian.py +426 -0
  384. neural_compressor-2.3/neural_compressor/experimental/strategy/exhaustive.py +47 -0
  385. neural_compressor-2.3/neural_compressor/experimental/strategy/mse.py +225 -0
  386. neural_compressor-2.3/neural_compressor/experimental/strategy/mse_v2.py +227 -0
  387. neural_compressor-2.3/neural_compressor/experimental/strategy/random.py +56 -0
  388. neural_compressor-2.3/neural_compressor/experimental/strategy/strategy.py +1396 -0
  389. neural_compressor-2.3/neural_compressor/experimental/strategy/utils/constant.py +47 -0
  390. neural_compressor-2.3/neural_compressor/experimental/strategy/utils/tuning_sampler.py +485 -0
  391. neural_compressor-2.3/neural_compressor/experimental/strategy/utils/tuning_space.py +725 -0
  392. neural_compressor-2.3/neural_compressor/experimental/strategy/utils/tuning_structs.py +106 -0
  393. neural_compressor-2.3/neural_compressor/experimental/strategy/utils/utility.py +60 -0
  394. neural_compressor-2.3/neural_compressor/metric/__init__.py +50 -0
  395. neural_compressor-2.3/neural_compressor/metric/bleu.py +143 -0
  396. neural_compressor-2.3/neural_compressor/metric/bleu_util.py +137 -0
  397. neural_compressor-2.3/neural_compressor/metric/coco_label_map.py +102 -0
  398. neural_compressor-2.3/neural_compressor/metric/coco_tools.py +694 -0
  399. neural_compressor-2.3/neural_compressor/metric/evaluate_squad.py +117 -0
  400. neural_compressor-2.3/neural_compressor/metric/f1.py +149 -0
  401. neural_compressor-2.3/neural_compressor/metric/metric.py +1684 -0
  402. neural_compressor-2.3/neural_compressor/mix_precision.py +179 -0
  403. neural_compressor-2.3/neural_compressor/model/__init__.py +22 -0
  404. neural_compressor-2.3/neural_compressor/model/base_model.py +64 -0
  405. neural_compressor-2.3/neural_compressor/model/keras_model.py +151 -0
  406. neural_compressor-2.3/neural_compressor/model/model.py +260 -0
  407. neural_compressor-2.3/neural_compressor/model/mxnet_model.py +76 -0
  408. neural_compressor-2.3/neural_compressor/model/nets_factory.py +161 -0
  409. neural_compressor-2.3/neural_compressor/model/onnx_model.py +914 -0
  410. neural_compressor-2.3/neural_compressor/model/tensorflow_model.py +1204 -0
  411. neural_compressor-2.3/neural_compressor/model/torch_model.py +593 -0
  412. neural_compressor-2.3/neural_compressor/objective.py +602 -0
  413. neural_compressor-2.3/neural_compressor/profiling/parser/factory.py +49 -0
  414. neural_compressor-2.3/neural_compressor/profiling/parser/onnx_parser/factory.py +41 -0
  415. neural_compressor-2.3/neural_compressor/profiling/parser/onnx_parser/parser.py +73 -0
  416. neural_compressor-2.3/neural_compressor/profiling/parser/parser.py +77 -0
  417. neural_compressor-2.3/neural_compressor/profiling/parser/result.py +64 -0
  418. neural_compressor-2.3/neural_compressor/profiling/parser/tensorflow_parser/factory.py +41 -0
  419. neural_compressor-2.3/neural_compressor/profiling/parser/tensorflow_parser/parser.py +107 -0
  420. neural_compressor-2.3/neural_compressor/profiling/profiler/factory.py +54 -0
  421. neural_compressor-2.3/neural_compressor/profiling/profiler/onnxrt_profiler/factory.py +45 -0
  422. neural_compressor-2.3/neural_compressor/profiling/profiler/onnxrt_profiler/profiler.py +89 -0
  423. neural_compressor-2.3/neural_compressor/profiling/profiler/tensorflow_profiler/factory.py +53 -0
  424. neural_compressor-2.3/neural_compressor/profiling/profiler/tensorflow_profiler/profiler.py +132 -0
  425. neural_compressor-2.3/neural_compressor/profiling/profiler/tensorflow_profiler/utils.py +85 -0
  426. neural_compressor-2.3/neural_compressor/quantization.py +252 -0
  427. neural_compressor-2.3/neural_compressor/strategy/__init__.py +29 -0
  428. neural_compressor-2.3/neural_compressor/strategy/auto.py +145 -0
  429. neural_compressor-2.3/neural_compressor/strategy/auto_mixed_precision.py +262 -0
  430. neural_compressor-2.3/neural_compressor/strategy/basic.py +432 -0
  431. neural_compressor-2.3/neural_compressor/strategy/bayesian.py +460 -0
  432. neural_compressor-2.3/neural_compressor/strategy/conservative.py +234 -0
  433. neural_compressor-2.3/neural_compressor/strategy/exhaustive.py +46 -0
  434. neural_compressor-2.3/neural_compressor/strategy/hawq_v2.py +120 -0
  435. neural_compressor-2.3/neural_compressor/strategy/mse.py +256 -0
  436. neural_compressor-2.3/neural_compressor/strategy/mse_v2.py +205 -0
  437. neural_compressor-2.3/neural_compressor/strategy/random.py +53 -0
  438. neural_compressor-2.3/neural_compressor/strategy/strategy.py +2105 -0
  439. neural_compressor-2.3/neural_compressor/strategy/utils/constant.py +58 -0
  440. neural_compressor-2.3/neural_compressor/strategy/utils/tuning_sampler.py +611 -0
  441. neural_compressor-2.3/neural_compressor/strategy/utils/tuning_space.py +793 -0
  442. neural_compressor-2.3/neural_compressor/strategy/utils/tuning_structs.py +112 -0
  443. neural_compressor-2.3/neural_compressor/strategy/utils/utility.py +172 -0
  444. neural_compressor-2.3/neural_compressor/training.py +480 -0
  445. neural_compressor-2.3/neural_compressor/utils/__init__.py +35 -0
  446. neural_compressor-2.3/neural_compressor/utils/collect_layer_histogram.py +67 -0
  447. neural_compressor-2.3/neural_compressor/utils/constant.py +86 -0
  448. neural_compressor-2.3/neural_compressor/utils/create_obj_from_config.py +236 -0
  449. neural_compressor-2.3/neural_compressor/utils/kl_divergence.py +140 -0
  450. neural_compressor-2.3/neural_compressor/utils/load_huggingface.py +232 -0
  451. neural_compressor-2.3/neural_compressor/utils/logger.py +132 -0
  452. neural_compressor-2.3/neural_compressor/utils/neural_insights_utils.py +174 -0
  453. neural_compressor-2.3/neural_compressor/utils/options.py +42 -0
  454. neural_compressor-2.3/neural_compressor/utils/pytorch.py +453 -0
  455. neural_compressor-2.3/neural_compressor/utils/utility.py +1094 -0
  456. neural_compressor-2.3/neural_compressor/utils/weights_details.py +78 -0
  457. neural_compressor-2.3/neural_compressor/version.py +18 -0
  458. neural_compressor-2.3/neural_compressor.egg-info/PKG-INFO +191 -0
  459. neural_compressor-2.3/neural_compressor.egg-info/SOURCES.txt +531 -0
  460. neural_compressor-2.3/neural_compressor.egg-info/requires.txt +18 -0
  461. neural_compressor-2.3/pyproject.toml +125 -0
  462. neural_compressor-2.3/setup.py +105 -0
  463. neural_compressor-2.2/PKG-INFO +0 -173
  464. neural_compressor-2.2/README.md +0 -156
  465. neural_compressor-2.2/neural_coder/__init__.py +0 -19
  466. neural_compressor-2.2/neural_coder/backends/nano_bf16.yaml +0 -27
  467. neural_compressor-2.2/neural_coder/backends/nano_bf16_channels_last.yaml +0 -27
  468. neural_compressor-2.2/neural_coder/backends/nano_bf16_ipex.yaml +0 -27
  469. neural_compressor-2.2/neural_coder/backends/nano_bf16_ipex_channels_last.yaml +0 -27
  470. neural_compressor-2.2/neural_coder/backends/nano_fp32_channels_last.yaml +0 -27
  471. neural_compressor-2.2/neural_coder/backends/nano_fp32_ipex.yaml +0 -27
  472. neural_compressor-2.2/neural_coder/backends/nano_fp32_ipex_channels_last.yaml +0 -27
  473. neural_compressor-2.2/neural_coder/backends/nano_gpu_to_cpu.yaml +0 -24
  474. neural_compressor-2.2/neural_coder/backends/nano_int8.yaml +0 -27
  475. neural_compressor-2.2/neural_coder/backends/nano_jit_bf16.yaml +0 -27
  476. neural_compressor-2.2/neural_coder/backends/nano_jit_bf16_channels_last.yaml +0 -27
  477. neural_compressor-2.2/neural_coder/backends/nano_jit_bf16_ipex.yaml +0 -27
  478. neural_compressor-2.2/neural_coder/backends/nano_jit_bf16_ipex_channels_last.yaml +0 -27
  479. neural_compressor-2.2/neural_coder/backends/nano_jit_fp32_channels_last.yaml +0 -27
  480. neural_compressor-2.2/neural_coder/backends/nano_jit_fp32_ipex_channels_last.yaml +0 -27
  481. neural_compressor-2.2/neural_coder/backends/nano_onnxruntime_fp32.yaml +0 -27
  482. neural_compressor-2.2/neural_coder/backends/nano_onnxruntime_int8_qlinear.yaml +0 -27
  483. neural_compressor-2.2/neural_coder/backends/nano_openvino_fp32.yaml +0 -27
  484. neural_compressor-2.2/neural_coder/backends/nano_openvino_int8.yaml +0 -27
  485. neural_compressor-2.2/neural_coder/backends/pytorch_aliblade.yaml +0 -25
  486. neural_compressor-2.2/neural_coder/backends/pytorch_inc_static_quant_fx.yaml +0 -46
  487. neural_compressor-2.2/neural_coder/backends/pytorch_inc_static_quant_fx_fp8.yaml +0 -46
  488. neural_compressor-2.2/neural_coder/backends/pytorch_jit_script.yaml +0 -36
  489. neural_compressor-2.2/neural_coder/backends/pytorch_jit_script_ofi.yaml +0 -35
  490. neural_compressor-2.2/neural_coder/backends/pytorch_mixed_precision_cpu.yaml +0 -28
  491. neural_compressor-2.2/neural_coder/coders/autoinc/autoinc_harness.py +0 -440
  492. neural_compressor-2.2/neural_coder/coders/autoinc/calib_dataloader.py +0 -42
  493. neural_compressor-2.2/neural_coder/coders/autoinc/domain.py +0 -32
  494. neural_compressor-2.2/neural_coder/coders/autoinc/eval_func.py +0 -110
  495. neural_compressor-2.2/neural_coder/coders/pytorch/batch_size.py +0 -84
  496. neural_compressor-2.2/neural_coder/coders/pytorch/change_trainer_to_nlptrainer.py +0 -46
  497. neural_compressor-2.2/neural_coder/coders/pytorch/cuda_to_cpu.py +0 -87
  498. neural_compressor-2.2/neural_coder/coders/pytorch/dummy_dataloader.py +0 -121
  499. neural_compressor-2.2/neural_coder/coders/pytorch/harness.py +0 -396
  500. neural_compressor-2.2/neural_coder/coders/pytorch/lightning.py +0 -85
  501. neural_compressor-2.2/neural_coder/coders/pytorch/reclaim_inference_transformers_trainer.py +0 -75
  502. neural_compressor-2.2/neural_coder/coders/pytorch/reclaim_inputs.py +0 -106
  503. neural_compressor-2.2/neural_coder/coders/tensorflow/amp.py +0 -61
  504. neural_compressor-2.2/neural_coder/coders/tensorflow/inc.py +0 -49
  505. neural_compressor-2.2/neural_coder/coders/transform.py +0 -87
  506. neural_compressor-2.2/neural_coder/globals.py +0 -116
  507. neural_compressor-2.2/neural_coder/graphers/code_line.py +0 -279
  508. neural_compressor-2.2/neural_coder/graphers/function.py +0 -192
  509. neural_compressor-2.2/neural_coder/graphers/model.py +0 -271
  510. neural_compressor-2.2/neural_coder/graphers/preloads/transformers.yaml +0 -2160
  511. neural_compressor-2.2/neural_coder/interface.py +0 -1302
  512. neural_compressor-2.2/neural_coder/launcher.py +0 -101
  513. neural_compressor-2.2/neural_coder/utils/common.py +0 -26
  514. neural_compressor-2.2/neural_coder/utils/cpu_info.py +0 -46
  515. neural_compressor-2.2/neural_coder/utils/device.py +0 -92
  516. neural_compressor-2.2/neural_coder/utils/handle_user_input.py +0 -234
  517. neural_compressor-2.2/neural_coder/utils/line_operation.py +0 -143
  518. neural_compressor-2.2/neural_coder/utils/numa_launcher.py +0 -805
  519. neural_compressor-2.2/neural_coder/utils/pdf_report.py +0 -424
  520. neural_compressor-2.2/neural_compressor/__init__.py +0 -28
  521. neural_compressor-2.2/neural_compressor/adaptor/__init__.py +0 -28
  522. neural_compressor-2.2/neural_compressor/adaptor/adaptor.py +0 -201
  523. neural_compressor-2.2/neural_compressor/adaptor/keras.py +0 -958
  524. neural_compressor-2.2/neural_compressor/adaptor/keras.yaml +0 -121
  525. neural_compressor-2.2/neural_compressor/adaptor/keras_utils/__init__.py +0 -17
  526. neural_compressor-2.2/neural_compressor/adaptor/keras_utils/conv2d.py +0 -76
  527. neural_compressor-2.2/neural_compressor/adaptor/keras_utils/dense.py +0 -72
  528. neural_compressor-2.2/neural_compressor/adaptor/keras_utils/depthwise_conv2d.py +0 -129
  529. neural_compressor-2.2/neural_compressor/adaptor/keras_utils/pool2d.py +0 -64
  530. neural_compressor-2.2/neural_compressor/adaptor/keras_utils/quantizer.py +0 -103
  531. neural_compressor-2.2/neural_compressor/adaptor/keras_utils/separable_conv2d.py +0 -118
  532. neural_compressor-2.2/neural_compressor/adaptor/mxnet.py +0 -498
  533. neural_compressor-2.2/neural_compressor/adaptor/mxnet.yaml +0 -355
  534. neural_compressor-2.2/neural_compressor/adaptor/mxnet_utils/__init__.py +0 -18
  535. neural_compressor-2.2/neural_compressor/adaptor/mxnet_utils/util.py +0 -914
  536. neural_compressor-2.2/neural_compressor/adaptor/onnxrt.py +0 -1615
  537. neural_compressor-2.2/neural_compressor/adaptor/onnxrt.yaml +0 -416
  538. neural_compressor-2.2/neural_compressor/adaptor/onnxrt_cuda.yaml +0 -435
  539. neural_compressor-2.2/neural_compressor/adaptor/onnxrt_trt.yaml +0 -141
  540. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/calibration.py +0 -717
  541. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/calibrator.py +0 -412
  542. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/operators/__init__.py +0 -29
  543. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/operators/activation.py +0 -149
  544. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/operators/argmax.py +0 -49
  545. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/operators/attention.py +0 -129
  546. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/operators/binary_op.py +0 -144
  547. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/operators/concat.py +0 -151
  548. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/operators/conv.py +0 -244
  549. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/operators/direct_q8.py +0 -91
  550. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/operators/embed_layernorm.py +0 -116
  551. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/operators/gather.py +0 -123
  552. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/operators/gavgpool.py +0 -103
  553. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/operators/gemm.py +0 -174
  554. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/operators/lstm.py +0 -132
  555. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/operators/matmul.py +0 -205
  556. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/operators/maxpool.py +0 -85
  557. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/operators/norm.py +0 -45
  558. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/operators/ops.py +0 -128
  559. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/operators/pad.py +0 -111
  560. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/operators/pooling.py +0 -129
  561. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/operators/reduce.py +0 -28
  562. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/operators/resize.py +0 -86
  563. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/operators/split.py +0 -155
  564. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/operators/unary_op.py +0 -27
  565. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/quantizer.py +0 -1187
  566. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/smooth_quant.py +0 -599
  567. neural_compressor-2.2/neural_compressor/adaptor/ox_utils/util.py +0 -521
  568. neural_compressor-2.2/neural_compressor/adaptor/pytorch.py +0 -4522
  569. neural_compressor-2.2/neural_compressor/adaptor/pytorch_cpu.yaml +0 -431
  570. neural_compressor-2.2/neural_compressor/adaptor/pytorch_gpu.yaml +0 -81
  571. neural_compressor-2.2/neural_compressor/adaptor/pytorch_ipex.yaml +0 -154
  572. neural_compressor-2.2/neural_compressor/adaptor/query.py +0 -75
  573. neural_compressor-2.2/neural_compressor/adaptor/tensorflow.py +0 -2371
  574. neural_compressor-2.2/neural_compressor/adaptor/tensorflow.yaml +0 -246
  575. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_converter.py +0 -903
  576. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_converter_without_calib.py +0 -366
  577. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/bf16/bf16_convert.py +0 -278
  578. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/convert_add_to_biasadd.py +0 -75
  579. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/convert_layout.py +0 -85
  580. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/convert_leakyrelu.py +0 -77
  581. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/convert_nan_to_random.py +0 -47
  582. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/convert_placeholder_to_const.py +0 -94
  583. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/dequantize_cast_optimizer.py +0 -81
  584. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/dilated_contraction.py +0 -90
  585. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/dummy_biasadd.py +0 -108
  586. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/expanddims_optimizer.py +0 -77
  587. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fetch_weight_from_reshape.py +0 -84
  588. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fold_batch_norm.py +0 -267
  589. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fold_constant.py +0 -179
  590. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_biasadd_add.py +0 -76
  591. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_column_wise_mul.py +0 -79
  592. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_conv_with_math.py +0 -112
  593. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_decomposed_bn.py +0 -406
  594. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_decomposed_in.py +0 -368
  595. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_gelu.py +0 -227
  596. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_layer_norm.py +0 -244
  597. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_pad_with_conv.py +0 -123
  598. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_pad_with_fp32_conv.py +0 -127
  599. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_reshape_transpose.py +0 -124
  600. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/graph_cse_optimizer.py +0 -145
  601. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/grappler_pass.py +0 -72
  602. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/insert_print_node.py +0 -217
  603. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/move_squeeze_after_relu.py +0 -114
  604. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/pre_optimize.py +0 -307
  605. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/remove_training_nodes.py +0 -71
  606. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/rename_batch_norm.py +0 -59
  607. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/split_shared_input.py +0 -60
  608. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/strip_equivalent_nodes.py +0 -50
  609. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/strip_unused_nodes.py +0 -39
  610. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/switch_optimizer.py +0 -81
  611. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/graph_base.py +0 -39
  612. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/freeze_fake_quant.py +0 -160
  613. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/freeze_value.py +0 -399
  614. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/freeze_value_without_calib.py +0 -133
  615. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/fuse_conv_redundant_dequantize.py +0 -140
  616. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/fuse_conv_requantize.py +0 -635
  617. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/fuse_matmul_redundant_dequantize.py +0 -152
  618. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/fuse_matmul_requantize.py +0 -748
  619. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/meta_op_optimizer.py +0 -113
  620. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/post_hostconst_converter.py +0 -42
  621. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/post_quantized_op_cse.py +0 -133
  622. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/rnn_convert.py +0 -338
  623. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/scale_propagation.py +0 -109
  624. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/onnx/onnx_graph.py +0 -1312
  625. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/onnx/onnx_node.py +0 -415
  626. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/onnx/onnx_schema.py +0 -129
  627. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/onnx/tf2onnx_utils.py +0 -562
  628. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/qdq/insert_qdq_pattern.py +0 -672
  629. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/qdq/merge_duplicated_qdq.py +0 -94
  630. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_rewriter/qdq/share_qdq_y_pattern.py +0 -56
  631. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/graph_util.py +0 -1000
  632. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/quantize_graph/qat/fake_quantize.py +0 -238
  633. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/quantize_graph/qat/quantize_config.py +0 -121
  634. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/quantize_graph/qat/quantize_helper.py +0 -86
  635. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/quantize_graph/qat/quantize_layers/optimize_layer.py +0 -34
  636. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/quantize_graph/qat/quantize_layers/quantize_layer_add.py +0 -81
  637. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/quantize_graph/qat/quantize_layers/quantize_layer_base.py +0 -86
  638. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/quantize_graph/qat/quantize_layers/quantize_layer_bn.py +0 -57
  639. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/quantize_graph/qat/quantize_wrapper.py +0 -282
  640. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/quantize_graph/qdq/fuse_qdq_bn.py +0 -289
  641. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/quantize_graph/qdq/fuse_qdq_concatv2.py +0 -258
  642. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/quantize_graph/qdq/fuse_qdq_conv.py +0 -1936
  643. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/quantize_graph/qdq/fuse_qdq_deconv.py +0 -526
  644. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/quantize_graph/qdq/fuse_qdq_in.py +0 -178
  645. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/quantize_graph/qdq/fuse_qdq_matmul.py +0 -1033
  646. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/quantize_graph/qdq/fuse_qdq_pooling.py +0 -132
  647. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/quantize_graph/qdq/optimize_qdq.py +0 -141
  648. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/quantize_graph/quantize_graph_base.py +0 -786
  649. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/quantize_graph/quantize_graph_bn.py +0 -284
  650. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/quantize_graph/quantize_graph_concatv2.py +0 -105
  651. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/quantize_graph/quantize_graph_conv.py +0 -395
  652. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/quantize_graph/quantize_graph_for_intel_cpu.py +0 -111
  653. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/quantize_graph/quantize_graph_matmul.py +0 -349
  654. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/quantize_graph/quantize_graph_pooling.py +0 -69
  655. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/quantize_graph_common.py +0 -446
  656. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/smooth_quant_calibration.py +0 -213
  657. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/smooth_quant_scaler.py +0 -148
  658. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/tf2onnx_converter.py +0 -328
  659. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/transform_graph/bias_correction.py +0 -144
  660. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/transform_graph/graph_transform_base.py +0 -110
  661. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/transform_graph/insert_logging.py +0 -221
  662. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/transform_graph/rerange_quantized_concat.py +0 -313
  663. neural_compressor-2.2/neural_compressor/adaptor/tf_utils/util.py +0 -620
  664. neural_compressor-2.2/neural_compressor/adaptor/torch_utils/bf16_convert.py +0 -89
  665. neural_compressor-2.2/neural_compressor/adaptor/torch_utils/hawq_metric.py +0 -622
  666. neural_compressor-2.2/neural_compressor/adaptor/torch_utils/mixed_precision.py +0 -43
  667. neural_compressor-2.2/neural_compressor/adaptor/torch_utils/model_wrapper.py +0 -148
  668. neural_compressor-2.2/neural_compressor/adaptor/torch_utils/pattern_detector.py +0 -164
  669. neural_compressor-2.2/neural_compressor/adaptor/torch_utils/smooth_quant.py +0 -1005
  670. neural_compressor-2.2/neural_compressor/adaptor/torch_utils/symbolic_trace.py +0 -78
  671. neural_compressor-2.2/neural_compressor/adaptor/torch_utils/util.py +0 -918
  672. neural_compressor-2.2/neural_compressor/algorithm/__init__.py +0 -32
  673. neural_compressor-2.2/neural_compressor/algorithm/algorithm.py +0 -231
  674. neural_compressor-2.2/neural_compressor/algorithm/fast_bias_correction.py +0 -150
  675. neural_compressor-2.2/neural_compressor/algorithm/smooth_quant.py +0 -90
  676. neural_compressor-2.2/neural_compressor/algorithm/weight_correction.py +0 -138
  677. neural_compressor-2.2/neural_compressor/benchmark.py +0 -545
  678. neural_compressor-2.2/neural_compressor/compression/__init__.py +0 -18
  679. neural_compressor-2.2/neural_compressor/compression/callbacks.py +0 -482
  680. neural_compressor-2.2/neural_compressor/compression/distillation/__init__.py +0 -17
  681. neural_compressor-2.2/neural_compressor/compression/distillation/criterions.py +0 -1449
  682. neural_compressor-2.2/neural_compressor/compression/pruner/__init__.py +0 -21
  683. neural_compressor-2.2/neural_compressor/compression/pruner/criteria.py +0 -292
  684. neural_compressor-2.2/neural_compressor/compression/pruner/model_slim/__init__.py +0 -19
  685. neural_compressor-2.2/neural_compressor/compression/pruner/model_slim/auto_slim.py +0 -132
  686. neural_compressor-2.2/neural_compressor/compression/pruner/model_slim/pattern_analyzer.py +0 -836
  687. neural_compressor-2.2/neural_compressor/compression/pruner/model_slim/weight_slim.py +0 -396
  688. neural_compressor-2.2/neural_compressor/compression/pruner/patterns.py +0 -1554
  689. neural_compressor-2.2/neural_compressor/compression/pruner/pruners.py +0 -1155
  690. neural_compressor-2.2/neural_compressor/compression/pruner/regs.py +0 -144
  691. neural_compressor-2.2/neural_compressor/compression/pruner/schedulers.py +0 -176
  692. neural_compressor-2.2/neural_compressor/compression/pruner/utils.py +0 -585
  693. neural_compressor-2.2/neural_compressor/conf/__init__.py +0 -17
  694. neural_compressor-2.2/neural_compressor/conf/config.py +0 -1738
  695. neural_compressor-2.2/neural_compressor/conf/dotdict.py +0 -92
  696. neural_compressor-2.2/neural_compressor/conf/pythonic_config.py +0 -1460
  697. neural_compressor-2.2/neural_compressor/config.py +0 -2307
  698. neural_compressor-2.2/neural_compressor/contrib/__init__.py +0 -19
  699. neural_compressor-2.2/neural_compressor/contrib/strategy/__init__.py +0 -27
  700. neural_compressor-2.2/neural_compressor/contrib/strategy/sigopt.py +0 -295
  701. neural_compressor-2.2/neural_compressor/contrib/strategy/tpe.py +0 -528
  702. neural_compressor-2.2/neural_compressor/data/__init__.py +0 -64
  703. neural_compressor-2.2/neural_compressor/data/dataloaders/__init__.py +0 -24
  704. neural_compressor-2.2/neural_compressor/data/dataloaders/base_dataloader.py +0 -119
  705. neural_compressor-2.2/neural_compressor/data/dataloaders/dataloader.py +0 -123
  706. neural_compressor-2.2/neural_compressor/data/dataloaders/default_dataloader.py +0 -143
  707. neural_compressor-2.2/neural_compressor/data/dataloaders/fetcher.py +0 -124
  708. neural_compressor-2.2/neural_compressor/data/dataloaders/mxnet_dataloader.py +0 -42
  709. neural_compressor-2.2/neural_compressor/data/dataloaders/onnxrt_dataloader.py +0 -82
  710. neural_compressor-2.2/neural_compressor/data/dataloaders/pytorch_dataloader.py +0 -69
  711. neural_compressor-2.2/neural_compressor/data/dataloaders/sampler.py +0 -136
  712. neural_compressor-2.2/neural_compressor/data/dataloaders/tensorflow_dataloader.py +0 -321
  713. neural_compressor-2.2/neural_compressor/data/datasets/__init__.py +0 -33
  714. neural_compressor-2.2/neural_compressor/data/datasets/bert_dataset.py +0 -469
  715. neural_compressor-2.2/neural_compressor/data/datasets/coco_dataset.py +0 -301
  716. neural_compressor-2.2/neural_compressor/data/datasets/dataset.py +0 -1114
  717. neural_compressor-2.2/neural_compressor/data/datasets/dummy_dataset.py +0 -143
  718. neural_compressor-2.2/neural_compressor/data/datasets/dummy_dataset_v2.py +0 -275
  719. neural_compressor-2.2/neural_compressor/data/datasets/imagenet_dataset.py +0 -219
  720. neural_compressor-2.2/neural_compressor/data/datasets/style_transfer_dataset.py +0 -84
  721. neural_compressor-2.2/neural_compressor/data/filters/__init__.py +0 -32
  722. neural_compressor-2.2/neural_compressor/data/filters/coco_filter.py +0 -60
  723. neural_compressor-2.2/neural_compressor/data/filters/filter.py +0 -177
  724. neural_compressor-2.2/neural_compressor/data/transforms/__init__.py +0 -39
  725. neural_compressor-2.2/neural_compressor/data/transforms/coco_transform.py +0 -46
  726. neural_compressor-2.2/neural_compressor/data/transforms/imagenet_transform.py +0 -421
  727. neural_compressor-2.2/neural_compressor/data/transforms/postprocess.py +0 -27
  728. neural_compressor-2.2/neural_compressor/data/transforms/tokenization.py +0 -342
  729. neural_compressor-2.2/neural_compressor/data/transforms/transform.py +0 -2731
  730. neural_compressor-2.2/neural_compressor/experimental/__init__.py +0 -35
  731. neural_compressor-2.2/neural_compressor/experimental/benchmark.py +0 -614
  732. neural_compressor-2.2/neural_compressor/experimental/common/__init__.py +0 -28
  733. neural_compressor-2.2/neural_compressor/experimental/common/criterion.py +0 -1551
  734. neural_compressor-2.2/neural_compressor/experimental/common/dataloader.py +0 -105
  735. neural_compressor-2.2/neural_compressor/experimental/common/metric.py +0 -38
  736. neural_compressor-2.2/neural_compressor/experimental/common/model.py +0 -68
  737. neural_compressor-2.2/neural_compressor/experimental/common/optimizer.py +0 -214
  738. neural_compressor-2.2/neural_compressor/experimental/common/postprocess.py +0 -27
  739. neural_compressor-2.2/neural_compressor/experimental/common/torch_utils.py +0 -62
  740. neural_compressor-2.2/neural_compressor/experimental/component.py +0 -531
  741. neural_compressor-2.2/neural_compressor/experimental/compression/__init__.py +0 -18
  742. neural_compressor-2.2/neural_compressor/experimental/compression/pruning.py +0 -184
  743. neural_compressor-2.2/neural_compressor/experimental/contrib/__init__.py +0 -19
  744. neural_compressor-2.2/neural_compressor/experimental/contrib/strategy/__init__.py +0 -26
  745. neural_compressor-2.2/neural_compressor/experimental/contrib/strategy/sigopt.py +0 -269
  746. neural_compressor-2.2/neural_compressor/experimental/contrib/strategy/tpe.py +0 -513
  747. neural_compressor-2.2/neural_compressor/experimental/data/__init__.py +0 -37
  748. neural_compressor-2.2/neural_compressor/experimental/data/dataloaders/base_dataloader.py +0 -119
  749. neural_compressor-2.2/neural_compressor/experimental/data/dataloaders/dataloader.py +0 -38
  750. neural_compressor-2.2/neural_compressor/experimental/data/dataloaders/default_dataloader.py +0 -143
  751. neural_compressor-2.2/neural_compressor/experimental/data/dataloaders/fetcher.py +0 -124
  752. neural_compressor-2.2/neural_compressor/experimental/data/dataloaders/mxnet_dataloader.py +0 -42
  753. neural_compressor-2.2/neural_compressor/experimental/data/dataloaders/onnxrt_dataloader.py +0 -82
  754. neural_compressor-2.2/neural_compressor/experimental/data/dataloaders/pytorch_dataloader.py +0 -69
  755. neural_compressor-2.2/neural_compressor/experimental/data/dataloaders/sampler.py +0 -136
  756. neural_compressor-2.2/neural_compressor/experimental/data/dataloaders/tensorflow_dataloader.py +0 -322
  757. neural_compressor-2.2/neural_compressor/experimental/data/datasets/__init__.py +0 -31
  758. neural_compressor-2.2/neural_compressor/experimental/data/datasets/bert_dataset.py +0 -469
  759. neural_compressor-2.2/neural_compressor/experimental/data/datasets/coco_dataset.py +0 -301
  760. neural_compressor-2.2/neural_compressor/experimental/data/datasets/dataset.py +0 -1114
  761. neural_compressor-2.2/neural_compressor/experimental/data/datasets/dummy_dataset.py +0 -143
  762. neural_compressor-2.2/neural_compressor/experimental/data/datasets/dummy_dataset_v2.py +0 -275
  763. neural_compressor-2.2/neural_compressor/experimental/data/datasets/imagenet_dataset.py +0 -219
  764. neural_compressor-2.2/neural_compressor/experimental/data/datasets/style_transfer_dataset.py +0 -84
  765. neural_compressor-2.2/neural_compressor/experimental/data/filters/__init__.py +0 -31
  766. neural_compressor-2.2/neural_compressor/experimental/data/filters/coco_filter.py +0 -60
  767. neural_compressor-2.2/neural_compressor/experimental/data/filters/filter.py +0 -177
  768. neural_compressor-2.2/neural_compressor/experimental/data/transforms/__init__.py +0 -31
  769. neural_compressor-2.2/neural_compressor/experimental/data/transforms/imagenet_transform.py +0 -421
  770. neural_compressor-2.2/neural_compressor/experimental/data/transforms/tokenization.py +0 -342
  771. neural_compressor-2.2/neural_compressor/experimental/data/transforms/transform.py +0 -2729
  772. neural_compressor-2.2/neural_compressor/experimental/distillation.py +0 -503
  773. neural_compressor-2.2/neural_compressor/experimental/export/__init__.py +0 -23
  774. neural_compressor-2.2/neural_compressor/experimental/export/qlinear2qdq.py +0 -85
  775. neural_compressor-2.2/neural_compressor/experimental/export/tf2onnx.py +0 -117
  776. neural_compressor-2.2/neural_compressor/experimental/export/torch2onnx.py +0 -195
  777. neural_compressor-2.2/neural_compressor/experimental/graph_optimization.py +0 -429
  778. neural_compressor-2.2/neural_compressor/experimental/metric/__init__.py +0 -32
  779. neural_compressor-2.2/neural_compressor/experimental/metric/bleu.py +0 -139
  780. neural_compressor-2.2/neural_compressor/experimental/metric/bleu_util.py +0 -139
  781. neural_compressor-2.2/neural_compressor/experimental/metric/coco_label_map.py +0 -103
  782. neural_compressor-2.2/neural_compressor/experimental/metric/coco_tools.py +0 -713
  783. neural_compressor-2.2/neural_compressor/experimental/metric/evaluate_squad.py +0 -120
  784. neural_compressor-2.2/neural_compressor/experimental/metric/f1.py +0 -144
  785. neural_compressor-2.2/neural_compressor/experimental/metric/metric.py +0 -1595
  786. neural_compressor-2.2/neural_compressor/experimental/mixed_precision.py +0 -226
  787. neural_compressor-2.2/neural_compressor/experimental/model_conversion.py +0 -354
  788. neural_compressor-2.2/neural_compressor/experimental/nas/basic_nas.py +0 -141
  789. neural_compressor-2.2/neural_compressor/experimental/nas/dynas.py +0 -110
  790. neural_compressor-2.2/neural_compressor/experimental/nas/nas.py +0 -387
  791. neural_compressor-2.2/neural_compressor/experimental/nas/nas_utils.py +0 -86
  792. neural_compressor-2.2/neural_compressor/experimental/nas/search_algorithms.py +0 -167
  793. neural_compressor-2.2/neural_compressor/experimental/pruner_legacy/__init__.py +0 -30
  794. neural_compressor-2.2/neural_compressor/experimental/pruner_legacy/gradient_sensitivity.py +0 -244
  795. neural_compressor-2.2/neural_compressor/experimental/pruner_legacy/group_lasso.py +0 -66
  796. neural_compressor-2.2/neural_compressor/experimental/pruner_legacy/magnitude.py +0 -106
  797. neural_compressor-2.2/neural_compressor/experimental/pruner_legacy/pattern_lock.py +0 -65
  798. neural_compressor-2.2/neural_compressor/experimental/pruner_legacy/pruner.py +0 -138
  799. neural_compressor-2.2/neural_compressor/experimental/pruning.py +0 -493
  800. neural_compressor-2.2/neural_compressor/experimental/pruning_recipes/__init__.py +0 -24
  801. neural_compressor-2.2/neural_compressor/experimental/pruning_recipes/patterns/__init__.py +0 -30
  802. neural_compressor-2.2/neural_compressor/experimental/pruning_recipes/patterns/pattern.py +0 -105
  803. neural_compressor-2.2/neural_compressor/experimental/pruning_recipes/patterns/tile_pattern.py +0 -81
  804. neural_compressor-2.2/neural_compressor/experimental/pruning_v2.py +0 -523
  805. neural_compressor-2.2/neural_compressor/experimental/pytorch_pruner/logger.py +0 -19
  806. neural_compressor-2.2/neural_compressor/experimental/pytorch_pruner/patterns.py +0 -574
  807. neural_compressor-2.2/neural_compressor/experimental/pytorch_pruner/prune_utils.py +0 -221
  808. neural_compressor-2.2/neural_compressor/experimental/pytorch_pruner/pruner.py +0 -347
  809. neural_compressor-2.2/neural_compressor/experimental/pytorch_pruner/pruning.py +0 -167
  810. neural_compressor-2.2/neural_compressor/experimental/pytorch_pruner/scheduler.py +0 -164
  811. neural_compressor-2.2/neural_compressor/experimental/quantization.py +0 -452
  812. neural_compressor-2.2/neural_compressor/experimental/scheduler.py +0 -404
  813. neural_compressor-2.2/neural_compressor/experimental/strategy/__init__.py +0 -30
  814. neural_compressor-2.2/neural_compressor/experimental/strategy/auto_mixed_precision.py +0 -156
  815. neural_compressor-2.2/neural_compressor/experimental/strategy/basic.py +0 -166
  816. neural_compressor-2.2/neural_compressor/experimental/strategy/bayesian.py +0 -441
  817. neural_compressor-2.2/neural_compressor/experimental/strategy/exhaustive.py +0 -45
  818. neural_compressor-2.2/neural_compressor/experimental/strategy/mse.py +0 -197
  819. neural_compressor-2.2/neural_compressor/experimental/strategy/mse_v2.py +0 -209
  820. neural_compressor-2.2/neural_compressor/experimental/strategy/random.py +0 -55
  821. neural_compressor-2.2/neural_compressor/experimental/strategy/strategy.py +0 -1295
  822. neural_compressor-2.2/neural_compressor/experimental/strategy/utils/constant.py +0 -35
  823. neural_compressor-2.2/neural_compressor/experimental/strategy/utils/tuning_sampler.py +0 -463
  824. neural_compressor-2.2/neural_compressor/experimental/strategy/utils/tuning_space.py +0 -702
  825. neural_compressor-2.2/neural_compressor/experimental/strategy/utils/tuning_structs.py +0 -104
  826. neural_compressor-2.2/neural_compressor/experimental/strategy/utils/utility.py +0 -57
  827. neural_compressor-2.2/neural_compressor/metric/__init__.py +0 -34
  828. neural_compressor-2.2/neural_compressor/metric/bleu.py +0 -139
  829. neural_compressor-2.2/neural_compressor/metric/bleu_util.py +0 -139
  830. neural_compressor-2.2/neural_compressor/metric/coco_label_map.py +0 -103
  831. neural_compressor-2.2/neural_compressor/metric/coco_tools.py +0 -713
  832. neural_compressor-2.2/neural_compressor/metric/evaluate_squad.py +0 -120
  833. neural_compressor-2.2/neural_compressor/metric/f1.py +0 -144
  834. neural_compressor-2.2/neural_compressor/metric/metric.py +0 -1672
  835. neural_compressor-2.2/neural_compressor/mix_precision.py +0 -174
  836. neural_compressor-2.2/neural_compressor/model/__init__.py +0 -25
  837. neural_compressor-2.2/neural_compressor/model/base_model.py +0 -64
  838. neural_compressor-2.2/neural_compressor/model/keras_model.py +0 -148
  839. neural_compressor-2.2/neural_compressor/model/model.py +0 -251
  840. neural_compressor-2.2/neural_compressor/model/mxnet_model.py +0 -71
  841. neural_compressor-2.2/neural_compressor/model/nets_factory.py +0 -83
  842. neural_compressor-2.2/neural_compressor/model/onnx_model.py +0 -763
  843. neural_compressor-2.2/neural_compressor/model/tensorflow_model.py +0 -1186
  844. neural_compressor-2.2/neural_compressor/model/torch_model.py +0 -440
  845. neural_compressor-2.2/neural_compressor/objective.py +0 -549
  846. neural_compressor-2.2/neural_compressor/profiling/parser/factory.py +0 -49
  847. neural_compressor-2.2/neural_compressor/profiling/parser/onnx_parser/factory.py +0 -41
  848. neural_compressor-2.2/neural_compressor/profiling/parser/onnx_parser/parser.py +0 -71
  849. neural_compressor-2.2/neural_compressor/profiling/parser/parser.py +0 -77
  850. neural_compressor-2.2/neural_compressor/profiling/parser/result.py +0 -64
  851. neural_compressor-2.2/neural_compressor/profiling/parser/tensorflow_parser/factory.py +0 -41
  852. neural_compressor-2.2/neural_compressor/profiling/parser/tensorflow_parser/parser.py +0 -107
  853. neural_compressor-2.2/neural_compressor/profiling/profiler/factory.py +0 -56
  854. neural_compressor-2.2/neural_compressor/profiling/profiler/onnxrt_profiler/factory.py +0 -46
  855. neural_compressor-2.2/neural_compressor/profiling/profiler/onnxrt_profiler/profiler.py +0 -91
  856. neural_compressor-2.2/neural_compressor/profiling/profiler/tensorflow_profiler/factory.py +0 -56
  857. neural_compressor-2.2/neural_compressor/profiling/profiler/tensorflow_profiler/profiler.py +0 -133
  858. neural_compressor-2.2/neural_compressor/profiling/profiler/tensorflow_profiler/utils.py +0 -86
  859. neural_compressor-2.2/neural_compressor/quantization.py +0 -242
  860. neural_compressor-2.2/neural_compressor/strategy/__init__.py +0 -30
  861. neural_compressor-2.2/neural_compressor/strategy/auto.py +0 -113
  862. neural_compressor-2.2/neural_compressor/strategy/auto_mixed_precision.py +0 -180
  863. neural_compressor-2.2/neural_compressor/strategy/basic.py +0 -381
  864. neural_compressor-2.2/neural_compressor/strategy/bayesian.py +0 -471
  865. neural_compressor-2.2/neural_compressor/strategy/conservative.py +0 -226
  866. neural_compressor-2.2/neural_compressor/strategy/exhaustive.py +0 -45
  867. neural_compressor-2.2/neural_compressor/strategy/hawq_v2.py +0 -113
  868. neural_compressor-2.2/neural_compressor/strategy/mse.py +0 -228
  869. neural_compressor-2.2/neural_compressor/strategy/mse_v2.py +0 -198
  870. neural_compressor-2.2/neural_compressor/strategy/random.py +0 -55
  871. neural_compressor-2.2/neural_compressor/strategy/strategy.py +0 -1813
  872. neural_compressor-2.2/neural_compressor/strategy/utils/constant.py +0 -36
  873. neural_compressor-2.2/neural_compressor/strategy/utils/tuning_sampler.py +0 -560
  874. neural_compressor-2.2/neural_compressor/strategy/utils/tuning_space.py +0 -756
  875. neural_compressor-2.2/neural_compressor/strategy/utils/tuning_structs.py +0 -103
  876. neural_compressor-2.2/neural_compressor/strategy/utils/utility.py +0 -89
  877. neural_compressor-2.2/neural_compressor/training.py +0 -480
  878. neural_compressor-2.2/neural_compressor/utils/__init__.py +0 -26
  879. neural_compressor-2.2/neural_compressor/utils/collect_layer_histogram.py +0 -69
  880. neural_compressor-2.2/neural_compressor/utils/constant.py +0 -93
  881. neural_compressor-2.2/neural_compressor/utils/create_obj_from_config.py +0 -230
  882. neural_compressor-2.2/neural_compressor/utils/kl_divergence.py +0 -151
  883. neural_compressor-2.2/neural_compressor/utils/load_huggingface.py +0 -230
  884. neural_compressor-2.2/neural_compressor/utils/logger.py +0 -143
  885. neural_compressor-2.2/neural_compressor/utils/neural_insights_utils.py +0 -121
  886. neural_compressor-2.2/neural_compressor/utils/options.py +0 -41
  887. neural_compressor-2.2/neural_compressor/utils/pytorch.py +0 -399
  888. neural_compressor-2.2/neural_compressor/utils/utility.py +0 -1076
  889. neural_compressor-2.2/neural_compressor/utils/weights_details.py +0 -77
  890. neural_compressor-2.2/neural_compressor/version.py +0 -19
  891. neural_compressor-2.2/neural_compressor.egg-info/PKG-INFO +0 -173
  892. neural_compressor-2.2/neural_compressor.egg-info/SOURCES.txt +0 -501
  893. neural_compressor-2.2/neural_compressor.egg-info/requires.txt +0 -18
  894. neural_compressor-2.2/setup.py +0 -107
  895. {neural_compressor-2.2 → neural_compressor-2.3}/LICENSE +0 -0
  896. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/__main__.py +0 -0
  897. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/__init__.py +0 -0
  898. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/intel_extension_for_transformers.yaml +0 -0
  899. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/keras_inc.yaml +0 -0
  900. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/nano_jit_fp32.yaml +0 -0
  901. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/nano_jit_fp32_ipex.yaml +0 -0
  902. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/onnx_inc_dynamic_quant.yaml +0 -0
  903. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/onnx_inc_static_quant_qdq.yaml +0 -0
  904. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/onnx_inc_static_quant_qlinear.yaml +0 -0
  905. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/pytorch_benchmark.yaml +0 -0
  906. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/pytorch_channels_last.yaml +0 -0
  907. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/pytorch_inc_bf16.yaml +0 -0
  908. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/pytorch_inc_dynamic_quant.yaml +0 -0
  909. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/pytorch_inc_dynamic_quant_fp8.yaml +0 -0
  910. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/pytorch_inc_huggingface_optimum_dynamic.yaml +0 -0
  911. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/pytorch_inc_huggingface_optimum_static.yaml +0 -0
  912. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/pytorch_inc_static_quant_ipex.yaml +0 -0
  913. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/pytorch_ipex_bf16.yaml +0 -0
  914. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/pytorch_ipex_fp32.yaml +0 -0
  915. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/pytorch_ipex_int8_dynamic_quant.yaml +0 -0
  916. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/pytorch_ipex_int8_static_quant.yaml +0 -0
  917. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/pytorch_jit_trace.yaml +0 -0
  918. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/pytorch_jit_trace_ofi.yaml +0 -0
  919. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/pytorch_mixed_precision_cuda.yaml +0 -0
  920. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/pytorch_mixed_precision_intel_gpu.yaml +0 -0
  921. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/pytorch_torchdynamo_jit_script.yaml +0 -0
  922. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/pytorch_torchdynamo_jit_script_ofi.yaml +0 -0
  923. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/pytorch_torchdynamo_jit_trace.yaml +0 -0
  924. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/pytorch_torchdynamo_jit_trace_ofi.yaml +0 -0
  925. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/backends/template.yaml +0 -0
  926. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/coders/__init__.py +0 -0
  927. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/coders/autoinc/__init__.py +0 -0
  928. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/coders/pytorch/__init__.py +0 -0
  929. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/coders/tensorflow/__init__.py +0 -0
  930. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/graphers/__init__.py +0 -0
  931. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/graphers/preloads/__init__.py +0 -0
  932. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/utils/__init__.py +0 -0
  933. {neural_compressor-2.2 → neural_compressor-2.3}/neural_coder/version.py +0 -0
  934. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/adaptor/ox_utils/__init__.py +0 -0
  935. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/adaptor/tensorflow_itex.yaml +0 -0
  936. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/adaptor/tf_utils/__init__.py +0 -0
  937. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/adaptor/tf_utils/graph_rewriter/__init__.py +0 -0
  938. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/adaptor/tf_utils/graph_rewriter/bf16/__init__.py +0 -0
  939. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/__init__.py +0 -0
  940. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/__init__.py +0 -0
  941. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/adaptor/tf_utils/graph_rewriter/onnx/__init__.py +0 -0
  942. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/adaptor/tf_utils/graph_rewriter/qdq/__init__.py +0 -0
  943. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/adaptor/tf_utils/quantize_graph/__init__.py +0 -0
  944. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/adaptor/tf_utils/quantize_graph/qat/__init__.py +0 -0
  945. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/adaptor/tf_utils/quantize_graph/qat/quantize_layers/__init__.py +0 -0
  946. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/adaptor/tf_utils/quantize_graph/qdq/__init__.py +0 -0
  947. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/adaptor/tf_utils/transform_graph/__init__.py +0 -0
  948. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/adaptor/torch_utils/__init__.py +0 -0
  949. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/experimental/data/dataloaders/__init__.py +0 -0
  950. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/experimental/nas/__init__.py +0 -0
  951. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/experimental/pytorch_pruner/__init__.py +0 -0
  952. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/experimental/strategy/utils/__init__.py +0 -0
  953. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/profiling/__init__.py +0 -0
  954. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/profiling/parser/__init__.py +0 -0
  955. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/profiling/parser/onnx_parser/__init__.py +0 -0
  956. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/profiling/parser/tensorflow_parser/__init__.py +0 -0
  957. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/profiling/profiler/__init__.py +0 -0
  958. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/profiling/profiler/onnxrt_profiler/__init__.py +0 -0
  959. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/profiling/profiler/onnxrt_profiler/utils.py +0 -0
  960. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/profiling/profiler/profiler.py +0 -0
  961. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/profiling/profiler/tensorflow_profiler/__init__.py +0 -0
  962. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor/strategy/utils/__init__.py +0 -0
  963. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor.egg-info/dependency_links.txt +0 -0
  964. {neural_compressor-2.2 → neural_compressor-2.3}/neural_compressor.egg-info/top_level.txt +0 -0
  965. {neural_compressor-2.2 → neural_compressor-2.3}/setup.cfg +0 -0
@@ -0,0 +1,191 @@
1
+ Metadata-Version: 2.1
2
+ Name: neural_compressor
3
+ Version: 2.3
4
+ Summary: Repository of Intel® Neural Compressor
5
+ Home-page: https://github.com/intel/neural-compressor
6
+ Author: Intel AIA Team
7
+ Author-email: feng.tian@intel.com, haihao.shen@intel.com, suyue.chen@intel.com
8
+ License: Apache 2.0
9
+ Keywords: quantization,auto-tuning,post-training static quantization,post-training dynamic quantization,quantization-aware training
10
+ Classifier: Intended Audience :: Science/Research
11
+ Classifier: Programming Language :: Python :: 3
12
+ Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
13
+ Classifier: License :: OSI Approved :: Apache Software License
14
+ Requires-Python: >=3.6.0
15
+ Description-Content-Type: text/markdown
16
+ License-File: LICENSE
17
+ Requires-Dist: deprecated>=1.2.13
18
+ Requires-Dist: numpy
19
+ Requires-Dist: opencv-python-headless
20
+ Requires-Dist: pandas
21
+ Requires-Dist: Pillow
22
+ Requires-Dist: prettytable
23
+ Requires-Dist: psutil
24
+ Requires-Dist: py-cpuinfo
25
+ Requires-Dist: pycocotools; sys_platform != "win32" or python_version > "3.8"
26
+ Requires-Dist: pycocotools-windows; sys_platform == "win32" and python_version <= "3.8"
27
+ Requires-Dist: pyyaml
28
+ Requires-Dist: requests
29
+ Requires-Dist: schema
30
+ Requires-Dist: scikit-learn
31
+
32
+ <div align="center">
33
+
34
+ Intel® Neural Compressor
35
+ ===========================
36
+ <h3> An open-source Python library supporting popular model compression techniques on all mainstream deep learning frameworks (TensorFlow, PyTorch, ONNX Runtime, and MXNet)</h3>
37
+
38
+ [![python](https://img.shields.io/badge/python-3.7%2B-blue)](https://github.com/intel/neural-compressor)
39
+ [![version](https://img.shields.io/badge/release-2.3-green)](https://github.com/intel/neural-compressor/releases)
40
+ [![license](https://img.shields.io/badge/license-Apache%202-blue)](https://github.com/intel/neural-compressor/blob/master/LICENSE)
41
+ [![coverage](https://img.shields.io/badge/coverage-85%25-green)](https://github.com/intel/neural-compressor)
42
+ [![Downloads](https://static.pepy.tech/personalized-badge/neural-compressor?period=total&units=international_system&left_color=grey&right_color=green&left_text=downloads)](https://pepy.tech/project/neural-compressor)
43
+
44
+ [Architecture](./docs/source/design.md#architecture)&nbsp;&nbsp;&nbsp;|&nbsp;&nbsp;&nbsp;[Workflow](./docs/source/design.md#workflow)&nbsp;&nbsp;&nbsp;|&nbsp;&nbsp;&nbsp;[Results](./docs/source/validated_model_list.md)&nbsp;&nbsp;&nbsp;|&nbsp;&nbsp;&nbsp;[Examples](./examples/README.md)&nbsp;&nbsp;&nbsp;|&nbsp;&nbsp;&nbsp;[Documentation](https://intel.github.io/neural-compressor)
45
+
46
+ ---
47
+ <div align="left">
48
+
49
+ Intel® Neural Compressor aims to provide popular model compression techniques such as quantization, pruning (sparsity), distillation, and neural architecture search on mainstream frameworks such as [TensorFlow](https://www.tensorflow.org/), [PyTorch](https://pytorch.org/), [ONNX Runtime](https://onnxruntime.ai/), and [MXNet](https://mxnet.apache.org/),
50
+ as well as Intel extensions such as [Intel Extension for TensorFlow](https://github.com/intel/intel-extension-for-tensorflow) and [Intel Extension for PyTorch](https://github.com/intel/intel-extension-for-pytorch).
51
+ In particular, the tool provides the following key features, typical examples, and open collaborations:
52
+
53
+ * Support a wide range of Intel hardware such as [Intel Xeon Scalable processor](https://www.intel.com/content/www/us/en/products/details/processors/xeon/scalable.html), [Intel Xeon CPU Max Series](https://www.intel.com/content/www/us/en/products/details/processors/xeon/max-series.html), [Intel Data Center GPU Flex Series](https://www.intel.com/content/www/us/en/products/details/discrete-gpus/data-center-gpu/flex-series.html), and [Intel Data Center GPU Max Series](https://www.intel.com/content/www/us/en/products/details/discrete-gpus/data-center-gpu/max-series.html) with extensive testing; support AMD CPU, ARM CPU, and NVIDIA GPU through ONNX Runtime with limited testing
54
+
55
+ * Validate popular LLMs such as LLama2, [LLama](examples/onnxrt/nlp/huggingface_model/text_generation/llama/quantization/ptq_static), [MPT](https://github.com/intel/intel-extension-for-transformers/blob/main/examples/huggingface/pytorch/text-generation/quantization/README.md), [Falcon](https://github.com/intel/intel-extension-for-transformers/blob/main/examples/huggingface/pytorch/language-modeling/quantization/README.md), [GPT-J](/examples/pytorch/nlp/huggingface_models/language-modeling/quantization/ptq_static/fx), [Bloom](/examples/pytorch/nlp/huggingface_models/language-modeling/quantization/ptq_static/ipex/smooth_quant), [OPT](/examples/pytorch/nlp/huggingface_models/language-modeling/quantization/ptq_static/ipex/smooth_quant), and more than 10,000 broad models such as [Stable Diffusion](/examples/pytorch/nlp/huggingface_models/text-to-image/quantization), [BERT-Large](/examples/pytorch/nlp/huggingface_models/text-classification/quantization/ptq_static/fx), and [ResNet50](/examples/pytorch/image_recognition/torchvision_models/quantization/ptq/cpu/fx) from popular model hubs such as [Hugging Face](https://huggingface.co/), [Torch Vision](https://pytorch.org/vision/stable/index.html), and [ONNX Model Zoo](https://github.com/onnx/models#models), by leveraging the zero-code optimization solution [Neural Coder](/neural_coder#what-do-we-offer) and automatic [accuracy-driven](/docs/source/design.md#workflow) quantization strategies
56
+
57
+ * Collaborate with cloud marketplaces such as [Google Cloud Platform](https://console.cloud.google.com/marketplace/product/bitnami-launchpad/inc-tensorflow-intel?project=verdant-sensor-286207), [Amazon Web Services](https://aws.amazon.com/marketplace/pp/prodview-yjyh2xmggbmga#pdp-support), and [Azure](https://azuremarketplace.microsoft.com/en-us/marketplace/apps/bitnami.inc-tensorflow-intel), software platforms such as [Alibaba Cloud](https://www.intel.com/content/www/us/en/developer/articles/technical/quantize-ai-by-oneapi-analytics-on-alibaba-cloud.html), [Tencent TACO](https://new.qq.com/rain/a/20221202A00B9S00), and [Microsoft Olive](https://github.com/microsoft/Olive), and the open AI ecosystem such as [Hugging Face](https://huggingface.co/blog/intel), [PyTorch](https://pytorch.org/tutorials/recipes/intel_neural_compressor_for_pytorch.html), [ONNX](https://github.com/onnx/models#models), [ONNX Runtime](https://github.com/microsoft/onnxruntime), and [Lightning AI](https://github.com/Lightning-AI/lightning/blob/master/docs/source-pytorch/advanced/post_training_quantization.rst)
58
+
59
+ ## Installation
60
+
61
+ ### Install from PyPI
62
+ ```Shell
63
+ pip install neural-compressor
64
+ ```
65
+ > More installation methods can be found at [Installation Guide](./docs/source/installation_guide.md). Please check out our [FAQ](./docs/source/faq.md) for more details.
66
+
67
+ ## Getting Started
68
+ ### Quantization with Python API
69
+
70
+ ```shell
71
+ # Install Intel Neural Compressor and TensorFlow
72
+ pip install neural-compressor
73
+ pip install tensorflow
74
+ # Prepare fp32 model
75
+ wget https://storage.googleapis.com/intel-optimized-tensorflow/models/v1_6/mobilenet_v1_1.0_224_frozen.pb
76
+ ```
77
+ ```python
78
+ from neural_compressor.data import DataLoader, Datasets
79
+ from neural_compressor.config import PostTrainingQuantConfig
80
+
81
+ dataset = Datasets("tensorflow")["dummy"](shape=(1, 224, 224, 3))
82
+ dataloader = DataLoader(framework="tensorflow", dataset=dataset)
83
+
84
+ from neural_compressor.quantization import fit
85
+
86
+ q_model = fit(
87
+ model="./mobilenet_v1_1.0_224_frozen.pb",
88
+ conf=PostTrainingQuantConfig(),
89
+ calib_dataloader=dataloader,
90
+ )
91
+ ```
92
+
93
+ ## Documentation
94
+
95
+ <table class="docutils">
96
+ <thead>
97
+ <tr>
98
+ <th colspan="8">Overview</th>
99
+ </tr>
100
+ </thead>
101
+ <tbody>
102
+ <tr>
103
+ <td colspan="2" align="center"><a href="./docs/source/design.md#architecture">Architecture</a></td>
104
+ <td colspan="2" align="center"><a href="./docs/source/design.md#workflow">Workflow</a></td>
105
+ <td colspan="2" align="center"><a href="examples/README.md">Examples</a></td>
106
+ <td colspan="2" align="center"><a href="https://intel.github.io/neural-compressor/latest/docs/source/api-doc/apis.html">APIs</a></td>
107
+ </tr>
108
+ </tbody>
109
+ <thead>
110
+ <tr>
111
+ <th colspan="8">Python-based APIs</th>
112
+ </tr>
113
+ </thead>
114
+ <tbody>
115
+ <tr>
116
+ <td colspan="2" align="center"><a href="./docs/source/quantization.md">Quantization</a></td>
117
+ <td colspan="2" align="center"><a href="./docs/source/mixed_precision.md">Advanced Mixed Precision</a></td>
118
+ <td colspan="2" align="center"><a href="./docs/source/pruning.md">Pruning (Sparsity)</a></td>
119
+ <td colspan="2" align="center"><a href="./docs/source/distillation.md">Distillation</a></td>
120
+ </tr>
121
+ <tr>
122
+ <td colspan="2" align="center"><a href="./docs/source/orchestration.md">Orchestration</a></td>
123
+ <td colspan="2" align="center"><a href="./docs/source/benchmark.md">Benchmarking</a></td>
124
+ <td colspan="2" align="center"><a href="./docs/source/distributed.md">Distributed Compression</a></td>
125
+ <td colspan="2" align="center"><a href="./docs/source/export.md">Model Export</a></td>
126
+ </tr>
127
+ </tbody>
128
+ <thead>
129
+ <tr>
130
+ <th colspan="8">Neural Coder (Zero-code Optimization)</th>
131
+ </tr>
132
+ </thead>
133
+ <tbody>
134
+ <tr>
135
+ <td colspan="2" align="center"><a href="./neural_coder/docs/PythonLauncher.md">Launcher</a></td>
136
+ <td colspan="2" align="center"><a href="./neural_coder/extensions/neural_compressor_ext_lab/README.md">JupyterLab Extension</a></td>
137
+ <td colspan="2" align="center"><a href="./neural_coder/extensions/neural_compressor_ext_vscode/README.md">Visual Studio Code Extension</a></td>
138
+ <td colspan="2" align="center"><a href="./neural_coder/docs/SupportMatrix.md">Support Matrix</a></td>
139
+ </tr>
140
+ </tbody>
141
+ <thead>
142
+ <tr>
143
+ <th colspan="8">Advanced Topics</th>
144
+ </tr>
145
+ </thead>
146
+ <tbody>
147
+ <tr>
148
+ <td colspan="2" align="center"><a href="./docs/source/adaptor.md">Adaptor</a></td>
149
+ <td colspan="2" align="center"><a href="./docs/source/tuning_strategies.md">Strategy</a></td>
150
+ <td colspan="2" align="center"><a href="./docs/source/distillation_quantization.md">Distillation for Quantization</a></td>
151
+ <td colspan="2" align="center"><a href="./docs/source/smooth_quant.md">SmoothQuant</a></td>
152
+ </tr>
153
+ <tr>
154
+ <td colspan="8" align="center"><a href="./docs/source/quantization_weight_only.md">Weight-Only Quantization (INT8/INT4/FP4/NF4)</a></td>
155
+ </tr>
156
+ </tbody>
157
+ <thead>
158
+ <tr>
159
+ <th colspan="8">Innovations for Productivity</th>
160
+ </tr>
161
+ </thead>
162
+ <tbody>
163
+ <tr>
164
+ <td colspan="4" align="center"><a href="./neural_insights/README.md">Neural Insights</a></td>
165
+ <td colspan="4" align="center"><a href="./neural_solution/README.md">Neural Solution</a></td>
166
+ </tr>
167
+ </tbody>
168
+ </table>
169
+
170
+ > More documentation can be found in the [User Guide](./docs/source/user_guide.md).
171
+
172
+ ## Selected Publications/Events
173
+ * arXiv: [Optimize Weight Rounding via Signed Gradient Descent for the Quantization of LLMs](https://arxiv.org/abs/2309.05516) (Sep 2023)
174
+ * Post on Social Media: [ONNXCommunityMeetup2023: INT8 Quantization for Large Language Models with Intel Neural Compressor](https://www.youtube.com/watch?v=luYBWA1Q5pQ) (July 2023)
175
+ * Blog by Intel: [Accelerate Llama 2 with Intel AI Hardware and Software Optimizations](https://www.intel.com/content/www/us/en/developer/articles/news/llama2.html) (July 2023)
176
+ * NeurIPS'2022: [Fast Distilbert on CPUs](https://arxiv.org/abs/2211.07715) (Oct 2022)
177
+ * NeurIPS'2022: [QuaLA-MiniLM: a Quantized Length Adaptive MiniLM](https://arxiv.org/abs/2210.17114) (Oct 2022)
178
+
179
+ > View [Full Publication List](./docs/source/publication_list.md).
180
+
181
+ ## Additional Content
182
+
183
+ * [Release Information](./docs/source/releases_info.md)
184
+ * [Contribution Guidelines](./docs/source/CONTRIBUTING.md)
185
+ * [Legal Information](./docs/source/legal_information.md)
186
+ * [Security Policy](SECURITY.md)
187
+
188
+ ## Communication
189
+ - [GitHub Issues](https://github.com/intel/neural-compressor/issues): mainly for bug reports, new feature requests, questions, etc.
190
+ - [Email](mailto:inc.maintainers@intel.com): feel free to share research ideas on model compression techniques by email for potential collaboration.
191
+ - [WeChat group](/docs/source/imgs/wechat_group.jpg): scan the QR code to join the technical discussion.
@@ -0,0 +1,160 @@
1
+ <div align="center">
2
+
3
+ Intel® Neural Compressor
4
+ ===========================
5
+ <h3> An open-source Python library supporting popular model compression techniques on all mainstream deep learning frameworks (TensorFlow, PyTorch, ONNX Runtime, and MXNet)</h3>
6
+
7
+ [![python](https://img.shields.io/badge/python-3.7%2B-blue)](https://github.com/intel/neural-compressor)
8
+ [![version](https://img.shields.io/badge/release-2.3-green)](https://github.com/intel/neural-compressor/releases)
9
+ [![license](https://img.shields.io/badge/license-Apache%202-blue)](https://github.com/intel/neural-compressor/blob/master/LICENSE)
10
+ [![coverage](https://img.shields.io/badge/coverage-85%25-green)](https://github.com/intel/neural-compressor)
11
+ [![Downloads](https://static.pepy.tech/personalized-badge/neural-compressor?period=total&units=international_system&left_color=grey&right_color=green&left_text=downloads)](https://pepy.tech/project/neural-compressor)
12
+
13
+ [Architecture](./docs/source/design.md#architecture)&nbsp;&nbsp;&nbsp;|&nbsp;&nbsp;&nbsp;[Workflow](./docs/source/design.md#workflow)&nbsp;&nbsp;&nbsp;|&nbsp;&nbsp;&nbsp;[Results](./docs/source/validated_model_list.md)&nbsp;&nbsp;&nbsp;|&nbsp;&nbsp;&nbsp;[Examples](./examples/README.md)&nbsp;&nbsp;&nbsp;|&nbsp;&nbsp;&nbsp;[Documentation](https://intel.github.io/neural-compressor)
14
+
15
+ ---
16
+ <div align="left">
17
+
18
+ Intel® Neural Compressor aims to provide popular model compression techniques such as quantization, pruning (sparsity), distillation, and neural architecture search on mainstream frameworks such as [TensorFlow](https://www.tensorflow.org/), [PyTorch](https://pytorch.org/), [ONNX Runtime](https://onnxruntime.ai/), and [MXNet](https://mxnet.apache.org/),
19
+ as well as Intel extensions such as [Intel Extension for TensorFlow](https://github.com/intel/intel-extension-for-tensorflow) and [Intel Extension for PyTorch](https://github.com/intel/intel-extension-for-pytorch).
20
+ In particular, the tool provides the key features, typical examples, and open collaborations as below:
21
+
22
+ * Support a wide range of Intel hardware such as [Intel Xeon Scalable processor](https://www.intel.com/content/www/us/en/products/details/processors/xeon/scalable.html), [Intel Xeon CPU Max Series](https://www.intel.com/content/www/us/en/products/details/processors/xeon/max-series.html), [Intel Data Center GPU Flex Series](https://www.intel.com/content/www/us/en/products/details/discrete-gpus/data-center-gpu/flex-series.html), and [Intel Data Center GPU Max Series](https://www.intel.com/content/www/us/en/products/details/discrete-gpus/data-center-gpu/max-series.html) with extensive testing; support AMD CPU, ARM CPU, and NVIDIA GPU through ONNX Runtime with limited testing
23
+
24
+ * Validate popular LLMs such as LLama2, [LLama](examples/onnxrt/nlp/huggingface_model/text_generation/llama/quantization/ptq_static), [MPT](https://github.com/intel/intel-extension-for-transformers/blob/main/examples/huggingface/pytorch/text-generation/quantization/README.md), [Falcon](https://github.com/intel/intel-extension-for-transformers/blob/main/examples/huggingface/pytorch/language-modeling/quantization/README.md), [GPT-J](/examples/pytorch/nlp/huggingface_models/language-modeling/quantization/ptq_static/fx), [Bloom](/examples/pytorch/nlp/huggingface_models/language-modeling/quantization/ptq_static/ipex/smooth_quant), [OPT](/examples/pytorch/nlp/huggingface_models/language-modeling/quantization/ptq_static/ipex/smooth_quant), and more than 10,000 broad models such as [Stable Diffusion](/examples/pytorch/nlp/huggingface_models/text-to-image/quantization), [BERT-Large](/examples/pytorch/nlp/huggingface_models/text-classification/quantization/ptq_static/fx), and [ResNet50](/examples/pytorch/image_recognition/torchvision_models/quantization/ptq/cpu/fx) from popular model hubs such as [Hugging Face](https://huggingface.co/), [Torch Vision](https://pytorch.org/vision/stable/index.html), and [ONNX Model Zoo](https://github.com/onnx/models#models), by leveraging zero-code optimization solution [Neural Coder](/neural_coder#what-do-we-offer) and automatic [accuracy-driven](/docs/source/design.md#workflow) quantization strategies
25
+
26
+ * Collaborate with cloud marketplace such as [Google Cloud Platform](https://console.cloud.google.com/marketplace/product/bitnami-launchpad/inc-tensorflow-intel?project=verdant-sensor-286207), [Amazon Web Services](https://aws.amazon.com/marketplace/pp/prodview-yjyh2xmggbmga#pdp-support), and [Azure](https://azuremarketplace.microsoft.com/en-us/marketplace/apps/bitnami.inc-tensorflow-intel), software platforms such as [Alibaba Cloud](https://www.intel.com/content/www/us/en/developer/articles/technical/quantize-ai-by-oneapi-analytics-on-alibaba-cloud.html), [Tencent TACO](https://new.qq.com/rain/a/20221202A00B9S00) and [Microsoft Olive](https://github.com/microsoft/Olive), and open AI ecosystem such as [Hugging Face](https://huggingface.co/blog/intel), [PyTorch](https://pytorch.org/tutorials/recipes/intel_neural_compressor_for_pytorch.html), [ONNX](https://github.com/onnx/models#models), [ONNX Runtime](https://github.com/microsoft/onnxruntime), and [Lightning AI](https://github.com/Lightning-AI/lightning/blob/master/docs/source-pytorch/advanced/post_training_quantization.rst)
27
+
28
+ ## Installation
29
+
30
+ ### Install from PyPI
31
+ ```Shell
32
+ pip install neural-compressor
33
+ ```
34
+ > More installation methods can be found at [Installation Guide](./docs/source/installation_guide.md). Please check out our [FAQ](./docs/source/faq.md) for more details.
35
+
36
+ ## Getting Started
37
+ ### Quantization with Python API
38
+
39
+ ```shell
40
+ # Install Intel Neural Compressor and TensorFlow
41
+ pip install neural-compressor
42
+ pip install tensorflow
43
+ # Prepare fp32 model
44
+ wget https://storage.googleapis.com/intel-optimized-tensorflow/models/v1_6/mobilenet_v1_1.0_224_frozen.pb
45
+ ```
46
+ ```python
47
+ from neural_compressor.data import DataLoader, Datasets
48
+ from neural_compressor.config import PostTrainingQuantConfig
49
+
50
+ dataset = Datasets("tensorflow")["dummy"](shape=(1, 224, 224, 3))
51
+ dataloader = DataLoader(framework="tensorflow", dataset=dataset)
52
+
53
+ from neural_compressor.quantization import fit
54
+
55
+ q_model = fit(
56
+ model="./mobilenet_v1_1.0_224_frozen.pb",
57
+ conf=PostTrainingQuantConfig(),
58
+ calib_dataloader=dataloader,
59
+ )
60
+ ```
61
+
62
+ ## Documentation
63
+
64
+ <table class="docutils">
65
+ <thead>
66
+ <tr>
67
+ <th colspan="8">Overview</th>
68
+ </tr>
69
+ </thead>
70
+ <tbody>
71
+ <tr>
72
+ <td colspan="2" align="center"><a href="./docs/source/design.md#architecture">Architecture</a></td>
73
+ <td colspan="2" align="center"><a href="./docs/source/design.md#workflow">Workflow</a></td>
74
+ <td colspan="2" align="center"><a href="examples/README.md">Examples</a></td>
75
+ <td colspan="2" align="center"><a href="https://intel.github.io/neural-compressor/latest/docs/source/api-doc/apis.html">APIs</a></td>
76
+ </tr>
77
+ </tbody>
78
+ <thead>
79
+ <tr>
80
+ <th colspan="8">Python-based APIs</th>
81
+ </tr>
82
+ </thead>
83
+ <tbody>
84
+ <tr>
85
+ <td colspan="2" align="center"><a href="./docs/source/quantization.md">Quantization</a></td>
86
+ <td colspan="2" align="center"><a href="./docs/source/mixed_precision.md">Advanced Mixed Precision</a></td>
87
+ <td colspan="2" align="center"><a href="./docs/source/pruning.md">Pruning (Sparsity)</a></td>
88
+ <td colspan="2" align="center"><a href="./docs/source/distillation.md">Distillation</a></td>
89
+ </tr>
90
+ <tr>
91
+ <td colspan="2" align="center"><a href="./docs/source/orchestration.md">Orchestration</a></td>
92
+ <td colspan="2" align="center"><a href="./docs/source/benchmark.md">Benchmarking</a></td>
93
+ <td colspan="2" align="center"><a href="./docs/source/distributed.md">Distributed Compression</a></td>
94
+ <td colspan="2" align="center"><a href="./docs/source/export.md">Model Export</a></td>
95
+ </tr>
96
+ </tbody>
97
+ <thead>
98
+ <tr>
99
+ <th colspan="8">Neural Coder (Zero-code Optimization)</th>
100
+ </tr>
101
+ </thead>
102
+ <tbody>
103
+ <tr>
104
+ <td colspan="2" align="center"><a href="./neural_coder/docs/PythonLauncher.md">Launcher</a></td>
105
+ <td colspan="2" align="center"><a href="./neural_coder/extensions/neural_compressor_ext_lab/README.md">JupyterLab Extension</a></td>
106
+ <td colspan="2" align="center"><a href="./neural_coder/extensions/neural_compressor_ext_vscode/README.md">Visual Studio Code Extension</a></td>
107
+ <td colspan="2" align="center"><a href="./neural_coder/docs/SupportMatrix.md">Support Matrix</a></td>
108
+ </tr>
109
+ </tbody>
110
+ <thead>
111
+ <tr>
112
+ <th colspan="8">Advanced Topics</th>
113
+ </tr>
114
+ </thead>
115
+ <tbody>
116
+ <tr>
117
+ <td colspan="2" align="center"><a href="./docs/source/adaptor.md">Adaptor</a></td>
118
+ <td colspan="2" align="center"><a href="./docs/source/tuning_strategies.md">Strategy</a></td>
119
+ <td colspan="2" align="center"><a href="./docs/source/distillation_quantization.md">Distillation for Quantization</a></td>
120
+ <td colspan="2" align="center"><a href="./docs/source/smooth_quant.md">SmoothQuant</a></td>
121
+ </tr>
122
+ <tr>
123
+ <td colspan="8" align="center"><a href="./docs/source/quantization_weight_only.md">Weight-Only Quantization (INT8/INT4/FP4/NF4)</a></td>
124
+ </tr>
125
+ </tbody>
126
+ <thead>
127
+ <tr>
128
+ <th colspan="8">Innovations for Productivity</th>
129
+ </tr>
130
+ </thead>
131
+ <tbody>
132
+ <tr>
133
+ <td colspan="4" align="center"><a href="./neural_insights/README.md">Neural Insights</a></td>
134
+ <td colspan="4" align="center"><a href="./neural_solution/README.md">Neural Solution</a></td>
135
+ </tr>
136
+ </tbody>
137
+ </table>
138
+
139
+ > More documentation can be found in the [User Guide](./docs/source/user_guide.md).
140
+
141
+ ## Selected Publications/Events
142
+ * arXiv: [Optimize Weight Rounding via Signed Gradient Descent for the Quantization of LLMs](https://arxiv.org/abs/2309.05516) (Sep 2023)
143
+ * Post on Social Media: [ONNXCommunityMeetup2023: INT8 Quantization for Large Language Models with Intel Neural Compressor](https://www.youtube.com/watch?v=luYBWA1Q5pQ) (July 2023)
144
+ * Blog by Intel: [Accelerate Llama 2 with Intel AI Hardware and Software Optimizations](https://www.intel.com/content/www/us/en/developer/articles/news/llama2.html) (July 2023)
145
+ * NeurIPS'2022: [Fast Distilbert on CPUs](https://arxiv.org/abs/2211.07715) (Oct 2022)
146
+ * NeurIPS'2022: [QuaLA-MiniLM: a Quantized Length Adaptive MiniLM](https://arxiv.org/abs/2210.17114) (Oct 2022)
147
+
148
+ > View [Full Publication List](./docs/source/publication_list.md).
149
+
150
+ ## Additional Content
151
+
152
+ * [Release Information](./docs/source/releases_info.md)
153
+ * [Contribution Guidelines](./docs/source/CONTRIBUTING.md)
154
+ * [Legal Information](./docs/source/legal_information.md)
155
+ * [Security Policy](SECURITY.md)
156
+
157
+ ## Communication
158
+ - [GitHub Issues](https://github.com/intel/neural-compressor/issues): mainly for bug reports, new feature requests, questions, etc.
159
+ - [Email](mailto:inc.maintainers@intel.com): feel free to share research ideas on model compression techniques by email for potential collaboration.
160
+ - [WeChat group](/docs/source/imgs/wechat_group.jpg): scan the QR code to join the technical discussion.
@@ -0,0 +1,20 @@
1
+ # Copyright (c) 2022 Intel Corporation
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+
15
+ from .interface import enable
16
+ from .interface import bench
17
+ from .interface import superbench
18
+
19
+ # from .interface import superreport
20
+ from .interface import auto_quant
@@ -0,0 +1,27 @@
1
+ # Copyright (c) 2022 Intel Corporation
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+
15
+ transformation:
16
+ location:
17
+ - ["insert_below_model_definition_line", "insert_below_input_definition_line"]
18
+ - "indent_inference_line"
19
+ content:
20
+ - |-
21
+ [+] from bigdl.nano.pytorch import InferenceOptimizer
22
+ [+] MODEL_NAME = InferenceOptimizer.quantize(MODEL_NAME, precision="bf16", input_sample=INPUT_NAME)
23
+ [+] with InferenceOptimizer.get_context(MODEL_NAME):
24
+ - 1
25
+ order:
26
+ - below:
27
+ above:
@@ -0,0 +1,27 @@
1
+ # Copyright (c) 2022 Intel Corporation
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+
15
+ transformation:
16
+ location:
17
+ - ["insert_below_model_definition_line", "insert_below_input_definition_line"]
18
+ - "indent_inference_line"
19
+ content:
20
+ - |-
21
+ [+] from bigdl.nano.pytorch import InferenceOptimizer
22
+ [+] MODEL_NAME = InferenceOptimizer.quantize(MODEL_NAME, precision="bf16", channels_last=True, input_sample=INPUT_NAME)
23
+ [+] with InferenceOptimizer.get_context(MODEL_NAME):
24
+ - 1
25
+ order:
26
+ - below:
27
+ above:
@@ -0,0 +1,27 @@
1
+ # Copyright (c) 2022 Intel Corporation
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+
15
+ transformation:
16
+ location:
17
+ - ["insert_below_model_definition_line", "insert_below_input_definition_line"]
18
+ - "indent_inference_line"
19
+ content:
20
+ - |-
21
+ [+] from bigdl.nano.pytorch import InferenceOptimizer
22
+ [+] MODEL_NAME = InferenceOptimizer.quantize(MODEL_NAME, precision="bf16", use_ipex=True, input_sample=INPUT_NAME)
23
+ [+] with InferenceOptimizer.get_context(MODEL_NAME):
24
+ - 1
25
+ order:
26
+ - below:
27
+ above:
@@ -0,0 +1,27 @@
1
+ # Copyright (c) 2022 Intel Corporation
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+
15
+ transformation:
16
+ location:
17
+ - ["insert_below_model_definition_line", "insert_below_input_definition_line"]
18
+ - "indent_inference_line"
19
+ content:
20
+ - |-
21
+ [+] from bigdl.nano.pytorch import InferenceOptimizer
22
+ [+] MODEL_NAME = InferenceOptimizer.quantize(MODEL_NAME, precision="bf16", use_ipex=True, channels_last=True, input_sample=INPUT_NAME)
23
+ [+] with InferenceOptimizer.get_context(MODEL_NAME):
24
+ - 1
25
+ order:
26
+ - below:
27
+ above:
@@ -0,0 +1,27 @@
1
+ # Copyright (c) 2022 Intel Corporation
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+
15
+ transformation:
16
+ location:
17
+ - ["insert_below_model_definition_line", "insert_below_input_definition_line"]
18
+ - "indent_inference_line"
19
+ content:
20
+ - |-
21
+ [+] from bigdl.nano.pytorch import InferenceOptimizer
22
+ [+] MODEL_NAME = InferenceOptimizer.trace(MODEL_NAME, channels_last=True, input_sample=INPUT_NAME)
23
+ [+] with InferenceOptimizer.get_context(MODEL_NAME):
24
+ - 1
25
+ order:
26
+ - below:
27
+ above:
@@ -0,0 +1,27 @@
1
+ # Copyright (c) 2022 Intel Corporation
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+
15
+ transformation:
16
+ location:
17
+ - ["insert_below_model_definition_line", "insert_below_input_definition_line"]
18
+ - "indent_inference_line"
19
+ content:
20
+ - |-
21
+ [+] from bigdl.nano.pytorch import InferenceOptimizer
22
+ [+] MODEL_NAME = InferenceOptimizer.trace(MODEL_NAME, use_ipex=True, input_sample=INPUT_NAME)
23
+ [+] with InferenceOptimizer.get_context(MODEL_NAME):
24
+ - 1
25
+ order:
26
+ - below:
27
+ above:
@@ -0,0 +1,27 @@
1
+ # Copyright (c) 2022 Intel Corporation
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+
15
+ transformation:
16
+ location:
17
+ - ["insert_below_model_definition_line", "insert_below_input_definition_line"]
18
+ - "indent_inference_line"
19
+ content:
20
+ - |-
21
+ [+] from bigdl.nano.pytorch import InferenceOptimizer
22
+ [+] MODEL_NAME = InferenceOptimizer.trace(MODEL_NAME, use_ipex=True, channels_last=True, input_sample=INPUT_NAME)
23
+ [+] with InferenceOptimizer.get_context(MODEL_NAME):
24
+ - 1
25
+ order:
26
+ - below:
27
+ above:
@@ -0,0 +1,24 @@
1
+ # Copyright (c) 2022 Intel Corporation
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+
15
+ transformation:
16
+ location:
17
+ - ["insert_above_model_definition_line", "insert_above_input_definition_line"]
18
+ content:
19
+ - |-
20
+ [+] from bigdl.nano.pytorch import patch_torch
21
+ [+] patch_torch()
22
+ order:
23
+ - below:
24
+ above:
@@ -0,0 +1,27 @@
1
+ # Copyright (c) 2022 Intel Corporation
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+
15
+ transformation:
16
+ location:
17
+ - ["insert_below_model_definition_line", "insert_below_input_definition_line"]
18
+ - "indent_inference_line"
19
+ content:
20
+ - |-
21
+ [+] from bigdl.nano.pytorch import InferenceOptimizer
22
+ [+] MODEL_NAME = InferenceOptimizer.quantize(MODEL_NAME, precision="int8", input_sample=INPUT_NAME)
23
+ [+] with InferenceOptimizer.get_context(MODEL_NAME):
24
+ - 1
25
+ order:
26
+ - below:
27
+ above: