neural-compressor 2.3.2__tar.gz → 2.4__tar.gz

This diff compares the contents of two publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between the package versions as they appear in their respective public registries.
Files changed (540)
  1. {neural_compressor-2.3.2 → neural_compressor-2.4}/PKG-INFO +24 -13
  2. {neural_compressor-2.3.2 → neural_compressor-2.4}/README.md +15 -11
  3. neural_compressor-2.4/neural_coder/backends/pytorch_inc_static_quant_ipex_xpu.yaml +34 -0
  4. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/graphers/function.py +1 -1
  5. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/interface.py +12 -0
  6. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/launcher.py +2 -0
  7. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/utils/numa_launcher.py +2 -2
  8. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/keras.py +1 -1
  9. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/onnxrt.py +318 -36
  10. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/onnxrt.yaml +93 -0
  11. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/calibration.py +38 -7
  12. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/operators/direct_q8.py +2 -1
  13. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/operators/gather.py +1 -1
  14. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/operators/lstm.py +7 -3
  15. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/operators/split.py +1 -1
  16. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/smooth_quant.py +1 -0
  17. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/util.py +47 -1
  18. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/weight_only.py +23 -11
  19. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/pytorch.py +217 -94
  20. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/pytorch_cpu.yaml +1 -0
  21. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/pytorch_ipex.yaml +82 -40
  22. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tensorflow.py +119 -20
  23. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tensorflow.yaml +1 -1
  24. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_converter.py +34 -0
  25. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/bf16/bf16_convert.py +1 -1
  26. {neural_compressor-2.3.2/neural_compressor/adaptor/tf_utils/graph_rewriter/generic → neural_compressor-2.4/neural_compressor/adaptor/tf_utils/graph_rewriter/bf16}/dequantize_cast_optimizer.py +0 -2
  27. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/convert_add_to_biasadd.py +2 -1
  28. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_pad_with_conv.py +1 -1
  29. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/insert_print_node.py +1 -1
  30. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/post_quantized_op_cse.py +1 -1
  31. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/qdq/insert_qdq_pattern.py +20 -0
  32. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_util.py +26 -1
  33. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/qdq/fuse_qdq_conv.py +1 -1
  34. neural_compressor-2.4/neural_compressor/adaptor/tf_utils/smooth_quant_calibration.py +492 -0
  35. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/smooth_quant_scaler.py +113 -0
  36. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/util.py +174 -4
  37. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/torch_utils/bf16_convert.py +4 -0
  38. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/torch_utils/gptq.py +193 -66
  39. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/torch_utils/layer_wise_quant/__init__.py +1 -1
  40. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/torch_utils/layer_wise_quant/quantize.py +2 -2
  41. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/torch_utils/layer_wise_quant/torch_load.py +20 -34
  42. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/torch_utils/layer_wise_quant/utils.py +43 -17
  43. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/torch_utils/mixed_precision.py +9 -3
  44. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/torch_utils/model_wrapper.py +146 -108
  45. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/torch_utils/smooth_quant.py +349 -118
  46. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/torch_utils/util.py +133 -70
  47. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/torch_utils/weight_only.py +23 -4
  48. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/algorithm/smooth_quant.py +6 -0
  49. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/benchmark.py +2 -3
  50. neural_compressor-2.3.2/neural_compressor/experimental/common/criterion.py → neural_compressor-2.4/neural_compressor/compression/distillation/criterions.py +24 -17
  51. neural_compressor-2.3.2/neural_compressor/experimental/common/optimizer.py → neural_compressor-2.4/neural_compressor/compression/distillation/optimizers.py +1 -1
  52. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/pruner/__init__.py +1 -1
  53. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/pruner/model_slim/pattern_analyzer.py +1 -1
  54. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/pruner/patterns/ninm.py +2 -2
  55. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/pruner/pruners/progressive.py +41 -9
  56. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/pruner/pruning.py +24 -7
  57. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/pruner/utils.py +44 -18
  58. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/config.py +121 -121
  59. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/datasets/dataset.py +1 -1
  60. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/benchmark.py +10 -0
  61. neural_compressor-2.3.2/neural_compressor/compression/distillation/criterions.py → neural_compressor-2.4/neural_compressor/experimental/common/criterion.py +23 -401
  62. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/common/dataloader.py +3 -0
  63. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/common/metric.py +2 -0
  64. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/common/model.py +3 -0
  65. neural_compressor-2.4/neural_compressor/experimental/common/optimizer.py +205 -0
  66. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/common/postprocess.py +2 -0
  67. neural_compressor-2.4/neural_compressor/experimental/common/torch_utils.py +68 -0
  68. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/component.py +1 -0
  69. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/contrib/strategy/sigopt.py +3 -0
  70. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/contrib/strategy/tpe.py +2 -0
  71. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/data/dataloaders/base_dataloader.py +3 -0
  72. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/data/dataloaders/dataloader.py +0 -2
  73. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/data/dataloaders/default_dataloader.py +3 -1
  74. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/data/dataloaders/fetcher.py +5 -0
  75. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/data/dataloaders/mxnet_dataloader.py +3 -0
  76. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/data/dataloaders/onnxrt_dataloader.py +4 -0
  77. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/data/dataloaders/pytorch_dataloader.py +2 -2
  78. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/data/dataloaders/sampler.py +6 -0
  79. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/data/dataloaders/tensorflow_dataloader.py +6 -2
  80. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/data/datasets/dataset.py +1 -1
  81. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/distillation.py +5 -1
  82. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/export/qlinear2qdq.py +3 -0
  83. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/export/tf2onnx.py +5 -0
  84. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/export/torch2onnx.py +8 -2
  85. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/graph_optimization.py +2 -0
  86. {neural_compressor-2.3.2/neural_compressor → neural_compressor-2.4/neural_compressor/experimental}/metric/bleu.py +4 -0
  87. {neural_compressor-2.3.2/neural_compressor → neural_compressor-2.4/neural_compressor/experimental}/metric/bleu_util.py +3 -0
  88. {neural_compressor-2.3.2/neural_compressor → neural_compressor-2.4/neural_compressor/experimental}/metric/coco_tools.py +8 -0
  89. {neural_compressor-2.3.2/neural_compressor → neural_compressor-2.4/neural_compressor/experimental}/metric/evaluate_squad.py +6 -0
  90. {neural_compressor-2.3.2/neural_compressor → neural_compressor-2.4/neural_compressor/experimental}/metric/f1.py +4 -0
  91. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/metric/metric.py +33 -1
  92. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/mixed_precision.py +2 -0
  93. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/model_conversion.py +2 -0
  94. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/nas/basic_nas.py +4 -0
  95. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/nas/dynas.py +3 -0
  96. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/nas/nas.py +3 -0
  97. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/nas/nas_utils.py +4 -0
  98. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/nas/search_algorithms.py +6 -0
  99. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/pruner_legacy/gradient_sensitivity.py +2 -0
  100. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/pruner_legacy/group_lasso.py +2 -3
  101. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/pruner_legacy/magnitude.py +2 -0
  102. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/pruner_legacy/pattern_lock.py +2 -0
  103. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/pruner_legacy/pruner.py +3 -0
  104. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/pruning.py +3 -1
  105. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/pruning_recipes/patterns/pattern.py +4 -2
  106. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/pruning_recipes/patterns/tile_pattern.py +7 -0
  107. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/pruning_v2.py +3 -1
  108. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/pytorch_pruner/patterns.py +6 -2
  109. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/pytorch_pruner/prune_utils.py +7 -0
  110. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/pytorch_pruner/pruner.py +8 -0
  111. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/pytorch_pruner/pruning.py +2 -0
  112. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/pytorch_pruner/scheduler.py +7 -0
  113. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/quantization.py +1 -0
  114. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/scheduler.py +3 -0
  115. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/strategy/auto_mixed_precision.py +2 -0
  116. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/strategy/basic.py +4 -5
  117. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/strategy/bayesian.py +7 -1
  118. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/strategy/exhaustive.py +3 -0
  119. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/strategy/mse.py +3 -2
  120. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/strategy/mse_v2.py +3 -5
  121. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/strategy/random.py +2 -2
  122. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/strategy/strategy.py +5 -13
  123. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/strategy/utils/tuning_sampler.py +9 -0
  124. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/strategy/utils/tuning_space.py +8 -0
  125. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/strategy/utils/tuning_structs.py +3 -1
  126. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/strategy/utils/utility.py +6 -0
  127. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/model/model.py +8 -2
  128. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/model/onnx_model.py +368 -11
  129. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/model/tensorflow_model.py +218 -7
  130. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/model/torch_model.py +46 -3
  131. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/profiling/profiler/factory.py +1 -1
  132. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/profiling/profiler/onnxrt_profiler/factory.py +1 -1
  133. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/profiling/profiler/onnxrt_profiler/profiler.py +1 -1
  134. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/profiling/profiler/tensorflow_profiler/factory.py +1 -1
  135. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/profiling/profiler/tensorflow_profiler/profiler.py +1 -1
  136. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/quantization.py +12 -1
  137. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/strategy/auto_mixed_precision.py +1 -1
  138. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/strategy/strategy.py +30 -1
  139. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/utils/create_obj_from_config.py +2 -1
  140. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/utils/load_huggingface.py +50 -0
  141. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/utils/pytorch.py +64 -4
  142. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/utils/utility.py +5 -2
  143. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/version.py +1 -1
  144. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor.egg-info/PKG-INFO +24 -13
  145. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor.egg-info/SOURCES.txt +6 -1
  146. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor.egg-info/requires.txt +9 -0
  147. neural_compressor-2.4/setup.cfg +9 -0
  148. neural_compressor-2.4/setup.py +185 -0
  149. neural_compressor-2.4/third-party-programs.txt +1909 -0
  150. neural_compressor-2.3.2/neural_compressor/adaptor/tf_utils/smooth_quant_calibration.py +0 -225
  151. neural_compressor-2.3.2/setup.cfg +0 -4
  152. neural_compressor-2.3.2/setup.py +0 -105
  153. {neural_compressor-2.3.2 → neural_compressor-2.4}/LICENSE +0 -0
  154. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/__init__.py +0 -0
  155. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/__main__.py +0 -0
  156. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/__init__.py +0 -0
  157. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/intel_extension_for_transformers.yaml +0 -0
  158. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/keras_inc.yaml +0 -0
  159. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/nano_bf16.yaml +0 -0
  160. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/nano_bf16_channels_last.yaml +0 -0
  161. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/nano_bf16_ipex.yaml +0 -0
  162. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/nano_bf16_ipex_channels_last.yaml +0 -0
  163. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/nano_fp32_channels_last.yaml +0 -0
  164. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/nano_fp32_ipex.yaml +0 -0
  165. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/nano_fp32_ipex_channels_last.yaml +0 -0
  166. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/nano_gpu_to_cpu.yaml +0 -0
  167. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/nano_int8.yaml +0 -0
  168. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/nano_jit_bf16.yaml +0 -0
  169. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/nano_jit_bf16_channels_last.yaml +0 -0
  170. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/nano_jit_bf16_ipex.yaml +0 -0
  171. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/nano_jit_bf16_ipex_channels_last.yaml +0 -0
  172. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/nano_jit_fp32.yaml +0 -0
  173. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/nano_jit_fp32_channels_last.yaml +0 -0
  174. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/nano_jit_fp32_ipex.yaml +0 -0
  175. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/nano_jit_fp32_ipex_channels_last.yaml +0 -0
  176. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/nano_onnxruntime_fp32.yaml +0 -0
  177. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/nano_onnxruntime_int8_qlinear.yaml +0 -0
  178. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/nano_openvino_fp32.yaml +0 -0
  179. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/nano_openvino_int8.yaml +0 -0
  180. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/onnx_inc_dynamic_quant.yaml +0 -0
  181. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/onnx_inc_static_quant_qdq.yaml +0 -0
  182. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/onnx_inc_static_quant_qlinear.yaml +0 -0
  183. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/pytorch_aliblade.yaml +0 -0
  184. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/pytorch_benchmark.yaml +0 -0
  185. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/pytorch_channels_last.yaml +0 -0
  186. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/pytorch_inc_bf16.yaml +0 -0
  187. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/pytorch_inc_dynamic_quant.yaml +0 -0
  188. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/pytorch_inc_dynamic_quant_fp8.yaml +0 -0
  189. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/pytorch_inc_huggingface_optimum_dynamic.yaml +0 -0
  190. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/pytorch_inc_huggingface_optimum_static.yaml +0 -0
  191. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/pytorch_inc_static_quant_fx.yaml +0 -0
  192. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/pytorch_inc_static_quant_fx_fp8.yaml +0 -0
  193. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/pytorch_inc_static_quant_ipex.yaml +0 -0
  194. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/pytorch_ipex_bf16.yaml +0 -0
  195. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/pytorch_ipex_fp32.yaml +0 -0
  196. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/pytorch_ipex_int8_dynamic_quant.yaml +0 -0
  197. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/pytorch_ipex_int8_static_quant.yaml +0 -0
  198. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/pytorch_jit_script.yaml +0 -0
  199. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/pytorch_jit_script_ofi.yaml +0 -0
  200. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/pytorch_jit_trace.yaml +0 -0
  201. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/pytorch_jit_trace_ofi.yaml +0 -0
  202. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/pytorch_mixed_precision_cpu.yaml +0 -0
  203. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/pytorch_mixed_precision_cuda.yaml +0 -0
  204. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/pytorch_mixed_precision_intel_gpu.yaml +0 -0
  205. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/pytorch_torchdynamo_jit_script.yaml +0 -0
  206. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/pytorch_torchdynamo_jit_script_ofi.yaml +0 -0
  207. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/pytorch_torchdynamo_jit_trace.yaml +0 -0
  208. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/pytorch_torchdynamo_jit_trace_ofi.yaml +0 -0
  209. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/backends/template.yaml +0 -0
  210. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/coders/__init__.py +0 -0
  211. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/coders/autoinc/__init__.py +0 -0
  212. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/coders/autoinc/autoinc_harness.py +0 -0
  213. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/coders/autoinc/calib_dataloader.py +0 -0
  214. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/coders/autoinc/domain.py +0 -0
  215. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/coders/autoinc/eval_func.py +0 -0
  216. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/coders/pytorch/__init__.py +0 -0
  217. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/coders/pytorch/batch_size.py +0 -0
  218. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/coders/pytorch/change_trainer_to_nlptrainer.py +0 -0
  219. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/coders/pytorch/cuda_to_cpu.py +0 -0
  220. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/coders/pytorch/dummy_dataloader.py +0 -0
  221. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/coders/pytorch/harness.py +0 -0
  222. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/coders/pytorch/lightning.py +0 -0
  223. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/coders/pytorch/reclaim_inference_transformers_trainer.py +0 -0
  224. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/coders/pytorch/reclaim_inputs.py +0 -0
  225. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/coders/tensorflow/__init__.py +0 -0
  226. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/coders/tensorflow/amp.py +0 -0
  227. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/coders/tensorflow/inc.py +0 -0
  228. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/coders/transform.py +0 -0
  229. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/globals.py +0 -0
  230. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/graphers/__init__.py +0 -0
  231. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/graphers/code_line.py +0 -0
  232. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/graphers/model.py +0 -0
  233. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/graphers/preloads/__init__.py +0 -0
  234. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/graphers/preloads/transformers.yaml +0 -0
  235. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/utils/__init__.py +0 -0
  236. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/utils/common.py +0 -0
  237. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/utils/cpu_info.py +0 -0
  238. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/utils/device.py +0 -0
  239. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/utils/handle_user_input.py +0 -0
  240. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/utils/line_operation.py +0 -0
  241. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/utils/pdf_report.py +0 -0
  242. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_coder/version.py +0 -0
  243. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/__init__.py +0 -0
  244. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/__init__.py +0 -0
  245. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/adaptor.py +0 -0
  246. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/keras.yaml +0 -0
  247. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/keras_utils/__init__.py +0 -0
  248. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/keras_utils/conv2d.py +0 -0
  249. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/keras_utils/dense.py +0 -0
  250. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/keras_utils/depthwise_conv2d.py +0 -0
  251. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/keras_utils/pool2d.py +0 -0
  252. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/keras_utils/quantizer.py +0 -0
  253. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/keras_utils/separable_conv2d.py +0 -0
  254. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/mxnet.py +0 -0
  255. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/mxnet.yaml +0 -0
  256. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/mxnet_utils/__init__.py +0 -0
  257. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/mxnet_utils/util.py +0 -0
  258. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/onnxrt_cuda.yaml +0 -0
  259. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/onnxrt_dml.yaml +0 -0
  260. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/onnxrt_dnnl.yaml +0 -0
  261. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/onnxrt_trt.yaml +0 -0
  262. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/__init__.py +0 -0
  263. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/calibrator.py +0 -0
  264. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/operators/__init__.py +0 -0
  265. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/operators/activation.py +0 -0
  266. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/operators/argmax.py +0 -0
  267. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/operators/attention.py +0 -0
  268. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/operators/binary_op.py +0 -0
  269. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/operators/concat.py +0 -0
  270. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/operators/conv.py +0 -0
  271. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/operators/embed_layernorm.py +0 -0
  272. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/operators/gavgpool.py +0 -0
  273. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/operators/gemm.py +0 -0
  274. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/operators/matmul.py +0 -0
  275. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/operators/maxpool.py +0 -0
  276. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/operators/norm.py +0 -0
  277. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/operators/ops.py +0 -0
  278. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/operators/pad.py +0 -0
  279. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/operators/pooling.py +0 -0
  280. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/operators/reduce.py +0 -0
  281. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/operators/resize.py +0 -0
  282. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/operators/unary_op.py +0 -0
  283. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/ox_utils/quantizer.py +0 -0
  284. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/pytorch_gpu.yaml +0 -0
  285. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/query.py +0 -0
  286. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tensorflow_itex.yaml +0 -0
  287. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/__init__.py +0 -0
  288. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_converter_without_calib.py +0 -0
  289. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/__init__.py +0 -0
  290. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/bf16/__init__.py +0 -0
  291. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/__init__.py +0 -0
  292. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/convert_layout.py +0 -0
  293. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/convert_leakyrelu.py +0 -0
  294. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/convert_nan_to_random.py +0 -0
  295. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/convert_placeholder_to_const.py +0 -0
  296. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/dilated_contraction.py +0 -0
  297. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/dummy_biasadd.py +0 -0
  298. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/expanddims_optimizer.py +0 -0
  299. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fetch_weight_from_reshape.py +0 -0
  300. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fold_batch_norm.py +0 -0
  301. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fold_constant.py +0 -0
  302. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_biasadd_add.py +0 -0
  303. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_column_wise_mul.py +0 -0
  304. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_conv_with_math.py +0 -0
  305. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_decomposed_bn.py +0 -0
  306. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_decomposed_in.py +0 -0
  307. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_gelu.py +0 -0
  308. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_layer_norm.py +0 -0
  309. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_pad_with_fp32_conv.py +0 -0
  310. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/fuse_reshape_transpose.py +0 -0
  311. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/graph_cse_optimizer.py +0 -0
  312. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/grappler_pass.py +0 -0
  313. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/move_squeeze_after_relu.py +0 -0
  314. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/pre_optimize.py +0 -0
  315. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/remove_training_nodes.py +0 -0
  316. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/rename_batch_norm.py +0 -0
  317. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/split_shared_input.py +0 -0
  318. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/strip_equivalent_nodes.py +0 -0
  319. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/strip_unused_nodes.py +0 -0
  320. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/generic/switch_optimizer.py +0 -0
  321. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/graph_base.py +0 -0
  322. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/__init__.py +0 -0
  323. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/freeze_fake_quant.py +0 -0
  324. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/freeze_value.py +0 -0
  325. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/freeze_value_without_calib.py +0 -0
  326. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/fuse_conv_redundant_dequantize.py +0 -0
  327. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/fuse_conv_requantize.py +0 -0
  328. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/fuse_matmul_redundant_dequantize.py +0 -0
  329. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/fuse_matmul_requantize.py +0 -0
  330. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/meta_op_optimizer.py +0 -0
  331. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/post_hostconst_converter.py +0 -0
  332. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/rnn_convert.py +0 -0
  333. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/int8/scale_propagation.py +0 -0
  334. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/onnx/__init__.py +0 -0
  335. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/onnx/onnx_graph.py +0 -0
  336. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/onnx/onnx_node.py +0 -0
  337. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/onnx/onnx_schema.py +0 -0
  338. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/onnx/tf2onnx_utils.py +0 -0
  339. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/qdq/__init__.py +0 -0
  340. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/qdq/merge_duplicated_qdq.py +0 -0
  341. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/graph_rewriter/qdq/share_qdq_y_pattern.py +0 -0
  342. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/__init__.py +0 -0
  343. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/qat/__init__.py +0 -0
  344. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/qat/fake_quantize.py +0 -0
  345. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/qat/quantize_config.py +0 -0
  346. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/qat/quantize_helper.py +0 -0
  347. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/qat/quantize_layers/__init__.py +0 -0
  348. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/qat/quantize_layers/optimize_layer.py +0 -0
  349. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/qat/quantize_layers/quantize_layer_add.py +0 -0
  350. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/qat/quantize_layers/quantize_layer_base.py +0 -0
  351. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/qat/quantize_layers/quantize_layer_bn.py +0 -0
  352. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/qat/quantize_wrapper.py +0 -0
  353. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/qdq/__init__.py +0 -0
  354. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/qdq/fuse_qdq_bn.py +0 -0
  355. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/qdq/fuse_qdq_concatv2.py +0 -0
  356. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/qdq/fuse_qdq_deconv.py +0 -0
  357. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/qdq/fuse_qdq_in.py +0 -0
  358. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/qdq/fuse_qdq_matmul.py +0 -0
  359. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/qdq/fuse_qdq_pooling.py +0 -0
  360. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/qdq/optimize_qdq.py +0 -0
  361. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/quantize_graph_base.py +0 -0
  362. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/quantize_graph_bn.py +0 -0
  363. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/quantize_graph_concatv2.py +0 -0
  364. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/quantize_graph_conv.py +0 -0
  365. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/quantize_graph_for_intel_cpu.py +0 -0
  366. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/quantize_graph_matmul.py +0 -0
  367. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph/quantize_graph_pooling.py +0 -0
  368. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/quantize_graph_common.py +0 -0
  369. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/tf2onnx_converter.py +0 -0
  370. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/transform_graph/__init__.py +0 -0
  371. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/transform_graph/bias_correction.py +0 -0
  372. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/transform_graph/graph_transform_base.py +0 -0
  373. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/transform_graph/insert_logging.py +0 -0
  374. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/tf_utils/transform_graph/rerange_quantized_concat.py +0 -0
  375. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/torch_utils/__init__.py +0 -0
  376. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/torch_utils/awq.py +0 -0
  377. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/torch_utils/hawq_metric.py +0 -0
  378. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/torch_utils/layer_wise_quant/modified_pickle.py +0 -0
  379. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/torch_utils/pattern_detector.py +0 -0
  380. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/torch_utils/symbolic_trace.py +0 -0
  381. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/adaptor/torch_utils/teq.py +0 -0
  382. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/algorithm/__init__.py +0 -0
  383. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/algorithm/algorithm.py +0 -0
  384. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/algorithm/fast_bias_correction.py +0 -0
  385. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/algorithm/weight_correction.py +0 -0
  386. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/__init__.py +0 -0
  387. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/callbacks.py +0 -0
  388. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/distillation/__init__.py +0 -0
  389. /neural_compressor-2.3.2/neural_compressor/experimental/common/torch_utils.py → /neural_compressor-2.4/neural_compressor/compression/distillation/utility.py +0 -0
  390. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/hpo/__init__.py +0 -0
  391. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/hpo/sa_optimizer.py +0 -0
  392. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/hpo/search_algorithms.py +0 -0
  393. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/hpo/search_space.py +0 -0
  394. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/pruner/criteria.py +0 -0
  395. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/pruner/model_slim/__init__.py +0 -0
  396. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/pruner/model_slim/auto_slim.py +0 -0
  397. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/pruner/model_slim/weight_slim.py +0 -0
  398. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/pruner/patterns/__init__.py +0 -0
  399. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/pruner/patterns/base.py +0 -0
  400. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/pruner/patterns/mha.py +0 -0
  401. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/pruner/patterns/nxm.py +0 -0
  402. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/pruner/pruners/__init__.py +0 -0
  403. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/pruner/pruners/base.py +0 -0
  404. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/pruner/pruners/basic.py +0 -0
  405. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/pruner/pruners/block_mask.py +0 -0
  406. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/pruner/pruners/mha.py +0 -0
  407. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/pruner/pruners/pattern_lock.py +0 -0
  408. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/pruner/pruners/retrain_free.py +0 -0
  409. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/pruner/pruners/sparse_gpt.py +0 -0
  410. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/pruner/regs.py +0 -0
  411. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/pruner/schedulers.py +0 -0
  412. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/compression/pruner/tf_criteria.py +0 -0
  413. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/conf/__init__.py +0 -0
  414. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/conf/config.py +0 -0
  415. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/conf/dotdict.py +0 -0
  416. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/conf/pythonic_config.py +0 -0
  417. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/contrib/__init__.py +0 -0
  418. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/contrib/strategy/__init__.py +0 -0
  419. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/contrib/strategy/sigopt.py +0 -0
  420. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/contrib/strategy/tpe.py +0 -0
  421. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/__init__.py +0 -0
  422. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/dataloaders/__init__.py +0 -0
  423. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/dataloaders/base_dataloader.py +0 -0
  424. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/dataloaders/dataloader.py +0 -0
  425. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/dataloaders/default_dataloader.py +0 -0
  426. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/dataloaders/fetcher.py +0 -0
  427. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/dataloaders/mxnet_dataloader.py +0 -0
  428. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/dataloaders/onnxrt_dataloader.py +0 -0
  429. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/dataloaders/pytorch_dataloader.py +0 -0
  430. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/dataloaders/sampler.py +0 -0
  431. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/dataloaders/tensorflow_dataloader.py +0 -0
  432. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/datasets/__init__.py +0 -0
  433. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/datasets/bert_dataset.py +0 -0
  434. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/datasets/coco_dataset.py +0 -0
  435. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/datasets/dummy_dataset.py +0 -0
  436. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/datasets/dummy_dataset_v2.py +0 -0
  437. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/datasets/imagenet_dataset.py +0 -0
  438. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/datasets/style_transfer_dataset.py +0 -0
  439. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/filters/__init__.py +0 -0
  440. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/filters/coco_filter.py +0 -0
  441. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/filters/filter.py +0 -0
  442. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/transforms/__init__.py +0 -0
  443. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/transforms/coco_transform.py +0 -0
  444. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/transforms/imagenet_transform.py +0 -0
  445. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/transforms/postprocess.py +0 -0
  446. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/transforms/tokenization.py +0 -0
  447. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/data/transforms/transform.py +0 -0
  448. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/__init__.py +0 -0
  449. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/common/__init__.py +0 -0
  450. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/compression/__init__.py +0 -0
  451. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/contrib/__init__.py +0 -0
  452. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/contrib/strategy/__init__.py +0 -0
  453. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/data/__init__.py +0 -0
  454. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/data/dataloaders/__init__.py +0 -0
  455. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/data/datasets/__init__.py +0 -0
  456. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/data/datasets/bert_dataset.py +0 -0
  457. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/data/datasets/coco_dataset.py +0 -0
  458. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/data/datasets/dummy_dataset.py +0 -0
  459. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/data/datasets/dummy_dataset_v2.py +0 -0
  460. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/data/datasets/imagenet_dataset.py +0 -0
  461. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/data/datasets/style_transfer_dataset.py +0 -0
  462. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/data/filters/__init__.py +0 -0
  463. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/data/filters/coco_filter.py +0 -0
  464. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/data/filters/filter.py +0 -0
  465. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/data/transforms/__init__.py +0 -0
  466. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/data/transforms/imagenet_transform.py +0 -0
  467. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/data/transforms/tokenization.py +0 -0
  468. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/data/transforms/transform.py +0 -0
  469. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/export/__init__.py +0 -0
  470. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/metric/__init__.py +0 -0
  471. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/metric/coco_label_map.py +0 -0
  472. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/nas/__init__.py +0 -0
  473. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/pruner_legacy/__init__.py +0 -0
  474. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/pruning_recipes/__init__.py +0 -0
  475. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/pruning_recipes/patterns/__init__.py +0 -0
  476. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/pytorch_pruner/__init__.py +0 -0
  477. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/pytorch_pruner/logger.py +0 -0
  478. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/strategy/__init__.py +0 -0
  479. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/strategy/utils/__init__.py +0 -0
  480. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/experimental/strategy/utils/constant.py +0 -0
  481. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/metric/__init__.py +0 -0
  482. {neural_compressor-2.3.2/neural_compressor/experimental → neural_compressor-2.4/neural_compressor}/metric/bleu.py +0 -0
  483. {neural_compressor-2.3.2/neural_compressor/experimental → neural_compressor-2.4/neural_compressor}/metric/bleu_util.py +0 -0
  484. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/metric/coco_label_map.py +0 -0
  485. {neural_compressor-2.3.2/neural_compressor/experimental → neural_compressor-2.4/neural_compressor}/metric/coco_tools.py +0 -0
  486. {neural_compressor-2.3.2/neural_compressor/experimental → neural_compressor-2.4/neural_compressor}/metric/evaluate_squad.py +0 -0
  487. {neural_compressor-2.3.2/neural_compressor/experimental → neural_compressor-2.4/neural_compressor}/metric/f1.py +0 -0
  488. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/metric/metric.py +0 -0
  489. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/mix_precision.py +0 -0
  490. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/model/__init__.py +0 -0
  491. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/model/base_model.py +0 -0
  492. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/model/keras_model.py +0 -0
  493. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/model/mxnet_model.py +0 -0
  494. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/model/nets_factory.py +0 -0
  495. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/objective.py +0 -0
  496. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/profiling/__init__.py +0 -0
  497. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/profiling/parser/__init__.py +0 -0
  498. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/profiling/parser/factory.py +0 -0
  499. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/profiling/parser/onnx_parser/__init__.py +0 -0
  500. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/profiling/parser/onnx_parser/factory.py +0 -0
  501. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/profiling/parser/onnx_parser/parser.py +0 -0
  502. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/profiling/parser/parser.py +0 -0
  503. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/profiling/parser/result.py +0 -0
  504. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/profiling/parser/tensorflow_parser/__init__.py +0 -0
  505. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/profiling/parser/tensorflow_parser/factory.py +0 -0
  506. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/profiling/parser/tensorflow_parser/parser.py +0 -0
  507. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/profiling/profiler/__init__.py +0 -0
  508. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/profiling/profiler/onnxrt_profiler/__init__.py +0 -0
  509. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/profiling/profiler/onnxrt_profiler/utils.py +0 -0
  510. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/profiling/profiler/profiler.py +0 -0
  511. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/profiling/profiler/tensorflow_profiler/__init__.py +0 -0
  512. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/profiling/profiler/tensorflow_profiler/utils.py +0 -0
  513. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/strategy/__init__.py +0 -0
  514. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/strategy/auto.py +0 -0
  515. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/strategy/basic.py +0 -0
  516. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/strategy/bayesian.py +0 -0
  517. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/strategy/conservative.py +0 -0
  518. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/strategy/exhaustive.py +0 -0
  519. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/strategy/hawq_v2.py +0 -0
  520. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/strategy/mse.py +0 -0
  521. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/strategy/mse_v2.py +0 -0
  522. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/strategy/random.py +0 -0
  523. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/strategy/utils/__init__.py +0 -0
  524. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/strategy/utils/constant.py +0 -0
  525. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/strategy/utils/tuning_sampler.py +0 -0
  526. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/strategy/utils/tuning_space.py +0 -0
  527. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/strategy/utils/tuning_structs.py +0 -0
  528. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/strategy/utils/utility.py +0 -0
  529. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/training.py +0 -0
  530. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/utils/__init__.py +0 -0
  531. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/utils/collect_layer_histogram.py +0 -0
  532. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/utils/constant.py +0 -0
  533. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/utils/kl_divergence.py +0 -0
  534. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/utils/logger.py +0 -0
  535. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/utils/neural_insights_utils.py +0 -0
  536. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/utils/options.py +0 -0
  537. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor/utils/weights_details.py +0 -0
  538. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor.egg-info/dependency_links.txt +0 -0
  539. {neural_compressor-2.3.2 → neural_compressor-2.4}/neural_compressor.egg-info/top_level.txt +0 -0
  540. {neural_compressor-2.3.2 → neural_compressor-2.4}/pyproject.toml +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: neural_compressor
3
- Version: 2.3.2
3
+ Version: 2.4
4
4
  Summary: Repository of Intel® Neural Compressor
5
5
  Home-page: https://github.com/intel/neural-compressor
6
6
  Author: Intel AIA Team
@@ -11,9 +11,10 @@ Classifier: Intended Audience :: Science/Research
11
11
  Classifier: Programming Language :: Python :: 3
12
12
  Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
13
13
  Classifier: License :: OSI Approved :: Apache Software License
14
- Requires-Python: >=3.6.0
14
+ Requires-Python: >=3.7.0
15
15
  Description-Content-Type: text/markdown
16
16
  License-File: LICENSE
17
+ License-File: third-party-programs.txt
17
18
  Requires-Dist: deprecated>=1.2.13
18
19
  Requires-Dist: numpy
19
20
  Requires-Dist: opencv-python-headless
@@ -28,6 +29,12 @@ Requires-Dist: pyyaml
28
29
  Requires-Dist: requests
29
30
  Requires-Dist: schema
30
31
  Requires-Dist: scikit-learn
32
+ Provides-Extra: pt
33
+ Requires-Dist: neural_compressor_3x_pt==2.4; extra == "pt"
34
+ Provides-Extra: tf
35
+ Requires-Dist: neural_compressor_3x_tf==2.4; extra == "tf"
36
+ Provides-Extra: ort
37
+ Requires-Dist: neural_compressor_3x_ort==2.4; extra == "ort"
31
38
 
32
39
  <div align="center">
33
40
 
@@ -35,8 +42,8 @@ Intel® Neural Compressor
35
42
  ===========================
36
43
  <h3> An open-source Python library supporting popular model compression techniques on all mainstream deep learning frameworks (TensorFlow, PyTorch, ONNX Runtime, and MXNet)</h3>
37
44
 
38
- [![python](https://img.shields.io/badge/python-3.7%2B-blue)](https://github.com/intel/neural-compressor)
39
- [![version](https://img.shields.io/badge/release-2.3.2-green)](https://github.com/intel/neural-compressor/releases)
45
+ [![python](https://img.shields.io/badge/python-3.8%2B-blue)](https://github.com/intel/neural-compressor)
46
+ [![version](https://img.shields.io/badge/release-2.4-green)](https://github.com/intel/neural-compressor/releases)
40
47
  [![license](https://img.shields.io/badge/license-Apache%202-blue)](https://github.com/intel/neural-compressor/blob/master/LICENSE)
41
48
  [![coverage](https://img.shields.io/badge/coverage-85%25-green)](https://github.com/intel/neural-compressor)
42
49
  [![Downloads](https://static.pepy.tech/personalized-badge/neural-compressor?period=total&units=international_system&left_color=grey&right_color=green&left_text=downloads)](https://pepy.tech/project/neural-compressor)
@@ -52,9 +59,9 @@ In particular, the tool provides the key features, typical examples, and open co
52
59
 
53
60
  * Support a wide range of Intel hardware such as [Intel Xeon Scalable Processors](https://www.intel.com/content/www/us/en/products/details/processors/xeon/scalable.html), [Intel Xeon CPU Max Series](https://www.intel.com/content/www/us/en/products/details/processors/xeon/max-series.html), [Intel Data Center GPU Flex Series](https://www.intel.com/content/www/us/en/products/details/discrete-gpus/data-center-gpu/flex-series.html), and [Intel Data Center GPU Max Series](https://www.intel.com/content/www/us/en/products/details/discrete-gpus/data-center-gpu/max-series.html) with extensive testing; support AMD CPU, ARM CPU, and NVidia GPU through ONNX Runtime with limited testing
54
61
 
55
- * Validate popular LLMs such as LLama2, [LLama](examples/onnxrt/nlp/huggingface_model/text_generation/llama/quantization/ptq_static), [MPT](https://github.com/intel/intel-extension-for-transformers/blob/main/examples/huggingface/pytorch/text-generation/quantization/README.md), [Falcon](https://github.com/intel/intel-extension-for-transformers/blob/main/examples/huggingface/pytorch/language-modeling/quantization/README.md), [GPT-J](/examples/pytorch/nlp/huggingface_models/language-modeling/quantization/ptq_static/fx), [Bloom](/examples/pytorch/nlp/huggingface_models/language-modeling/quantization/ptq_static/ipex/smooth_quant), [OPT](/examples/pytorch/nlp/huggingface_models/language-modeling/quantization/ptq_static/ipex/smooth_quant), and more than 10,000 broad models such as [Stable Diffusion](/examples/pytorch/nlp/huggingface_models/text-to-image/quantization), [BERT-Large](/examples/pytorch/nlp/huggingface_models/text-classification/quantization/ptq_static/fx), and [ResNet50](/examples/pytorch/image_recognition/torchvision_models/quantization/ptq/cpu/fx) from popular model hubs such as [Hugging Face](https://huggingface.co/), [Torch Vision](https://pytorch.org/vision/stable/index.html), and [ONNX Model Zoo](https://github.com/onnx/models#models), by leveraging zero-code optimization solution [Neural Coder](/neural_coder#what-do-we-offer) and automatic [accuracy-driven](/docs/source/design.md#workflow) quantization strategies
62
+ * Validate popular LLMs such as [LLama2](/examples/pytorch/nlp/huggingface_models/language-modeling/quantization/llm), [Falcon](/examples/pytorch/nlp/huggingface_models/language-modeling/quantization/llm), [GPT-J](/examples/pytorch/nlp/huggingface_models/language-modeling/quantization/llm), [Bloom](/examples/pytorch/nlp/huggingface_models/language-modeling/quantization/llm), [OPT](/examples/pytorch/nlp/huggingface_models/language-modeling/quantization/llm), and more than 10,000 broad models such as [Stable Diffusion](/examples/pytorch/nlp/huggingface_models/text-to-image/quantization), [BERT-Large](/examples/pytorch/nlp/huggingface_models/text-classification/quantization/ptq_static/fx), and [ResNet50](/examples/pytorch/image_recognition/torchvision_models/quantization/ptq/cpu/fx) from popular model hubs such as [Hugging Face](https://huggingface.co/), [Torch Vision](https://pytorch.org/vision/stable/index.html), and [ONNX Model Zoo](https://github.com/onnx/models#models), by leveraging zero-code optimization solution [Neural Coder](/neural_coder#what-do-we-offer) and automatic [accuracy-driven](/docs/source/design.md#workflow) quantization strategies
56
63
 
57
- * Collaborate with cloud marketplace such as [Google Cloud Platform](https://console.cloud.google.com/marketplace/product/bitnami-launchpad/inc-tensorflow-intel?project=verdant-sensor-286207), [Amazon Web Services](https://aws.amazon.com/marketplace/pp/prodview-yjyh2xmggbmga#pdp-support), and [Azure](https://azuremarketplace.microsoft.com/en-us/marketplace/apps/bitnami.inc-tensorflow-intel), software platforms such as [Alibaba Cloud](https://www.intel.com/content/www/us/en/developer/articles/technical/quantize-ai-by-oneapi-analytics-on-alibaba-cloud.html), [Tencent TACO](https://new.qq.com/rain/a/20221202A00B9S00) and [Microsoft Olive](https://github.com/microsoft/Olive), and open AI ecosystem such as [Hugging Face](https://huggingface.co/blog/intel), [PyTorch](https://pytorch.org/tutorials/recipes/intel_neural_compressor_for_pytorch.html), [ONNX](https://github.com/onnx/models#models), [ONNX Runtime](https://github.com/microsoft/onnxruntime), and [Lightning AI](https://github.com/Lightning-AI/lightning/blob/master/docs/source-pytorch/advanced/post_training_quantization.rst)
64
+ * Collaborate with cloud marketplaces such as [Google Cloud Platform](https://console.cloud.google.com/marketplace/product/bitnami-launchpad/inc-tensorflow-intel?project=verdant-sensor-286207), [Amazon Web Services](https://aws.amazon.com/marketplace/pp/prodview-yjyh2xmggbmga#pdp-support), and [Azure](https://azuremarketplace.microsoft.com/en-us/marketplace/apps/bitnami.inc-tensorflow-intel), software platforms such as [Alibaba Cloud](https://www.intel.com/content/www/us/en/developer/articles/technical/quantize-ai-by-oneapi-analytics-on-alibaba-cloud.html), [Tencent TACO](https://new.qq.com/rain/a/20221202A00B9S00) and [Microsoft Olive](https://github.com/microsoft/Olive), and open AI ecosystem such as [Hugging Face](https://huggingface.co/blog/intel), [PyTorch](https://pytorch.org/tutorials/recipes/intel_neural_compressor_for_pytorch.html), [ONNX](https://github.com/onnx/models#models), [ONNX Runtime](https://github.com/microsoft/onnxruntime), and [Lightning AI](https://github.com/Lightning-AI/lightning/blob/master/docs/source-pytorch/advanced/post_training_quantization.rst)
58
65
 
59
66
  ## Installation
60
67
 
@@ -62,7 +69,8 @@ In particular, the tool provides the key features, typical examples, and open co
62
69
  ```Shell
63
70
  pip install neural-compressor
64
71
  ```
65
- > More installation methods can be found at [Installation Guide](./docs/source/installation_guide.md). Please check out our [FAQ](./docs/source/faq.md) for more details.
72
+ > **Note**:
73
+ > More installation methods can be found at [Installation Guide](https://github.com/intel/neural-compressor/blob/master/docs/source/installation_guide.md). Please check out our [FAQ](https://github.com/intel/neural-compressor/blob/master/docs/source/faq.md) for more details.
66
74
 
67
75
  ## Getting Started
68
76
  ### Quantization with Python API
@@ -152,7 +160,8 @@ q_model = fit(
152
160
  </tr>
153
161
  <tr>
154
162
  <td colspan="4" align="center"><a href="./docs/source/quantization_weight_only.md">Weight-Only Quantization (INT8/INT4/FP4/NF4) </td>
155
- <td colspan="4" align="center"><a href="https://github.com/intel/neural-compressor/blob/fp8_adaptor/docs/source/fp8.md">FP8 Quantization </td>
163
+ <td colspan="2" align="center"><a href="https://github.com/intel/neural-compressor/blob/fp8_adaptor/docs/source/fp8.md">FP8 Quantization </td>
164
+ <td colspan="2" align="center"><a href="./docs/source/quantization_layer_wise.md">Layer-Wise Quantization </td>
156
165
  </tr>
157
166
  </tbody>
158
167
  <thead>
@@ -168,18 +177,19 @@ q_model = fit(
168
177
  </tbody>
169
178
  </table>
170
179
 
171
- > More documentations can be found at [User Guide](./docs/source/user_guide.md).
180
+ > **Note**:
181
+ > More documentation can be found at [User Guide](https://github.com/intel/neural-compressor/blob/master/docs/source/user_guide.md).
172
182
 
173
183
  ## Selected Publications/Events
184
+ * Blog by Intel: [Effective Weight-Only Quantization for Large Language Models with Intel® Neural Compressor](https://community.intel.com/t5/Blogs/Tech-Innovation/Artificial-Intelligence-AI/Effective-Weight-Only-Quantization-for-Large-Language-Models/post/1529552) (Oct 2023)
174
185
  * EMNLP'2023 (Under Review): [TEQ: Trainable Equivalent Transformation for Quantization of LLMs](https://openreview.net/forum?id=iaI8xEINAf&referrer=%5BAuthor%20Console%5D) (Sep 2023)
175
186
  * arXiv: [Efficient Post-training Quantization with FP8 Formats](https://arxiv.org/abs/2309.14592) (Sep 2023)
176
187
  * arXiv: [Optimize Weight Rounding via Signed Gradient Descent for the Quantization of LLMs](https://arxiv.org/abs/2309.05516) (Sep 2023)
177
- * Post on Social Media: [ONNXCommunityMeetup2023: INT8 Quantization for Large Language Models with Intel Neural Compressor](https://www.youtube.com/watch?v=luYBWA1Q5pQ) (July 2023)
178
- * Blog by Intel: [Accelerate Llama 2 with Intel AI Hardware and Software Optimizations](https://www.intel.com/content/www/us/en/developer/articles/news/llama2.html) (July 2023)
179
188
  * NeurIPS'2022: [Fast Distilbert on CPUs](https://arxiv.org/abs/2211.07715) (Oct 2022)
180
189
  * NeurIPS'2022: [QuaLA-MiniLM: a Quantized Length Adaptive MiniLM](https://arxiv.org/abs/2210.17114) (Oct 2022)
181
190
 
182
- > View [Full Publication List](./docs/source/publication_list.md).
191
+ > **Note**:
192
+ > View [Full Publication List](https://github.com/intel/neural-compressor/blob/master/docs/source/publication_list.md).
183
193
 
184
194
  ## Additional Content
185
195
 
@@ -189,6 +199,7 @@ q_model = fit(
189
199
  * [Security Policy](SECURITY.md)
190
200
 
191
201
  ## Communication
192
- - [GitHub Issues](https://github.com/intel/neural-compressor/issues): mainly for bugs report, new feature request, question asking, etc.
202
+ - [GitHub Issues](https://github.com/intel/neural-compressor/issues): mainly for bug reports, new feature requests, question asking, etc.
193
203
  - [Email](mailto:inc.maintainers@intel.com): welcome to raise any interesting research ideas on model compression techniques by email for collaborations.
204
+ - [Discord Channel](https://discord.com/invite/Wxk3J3ZJkU): join the discord channel for more flexible technical discussion.
194
205
  - [WeChat group](/docs/source/imgs/wechat_group.jpg): scan the QR code to join the technical discussion.
@@ -4,8 +4,8 @@ Intel® Neural Compressor
4
4
  ===========================
5
5
  <h3> An open-source Python library supporting popular model compression techniques on all mainstream deep learning frameworks (TensorFlow, PyTorch, ONNX Runtime, and MXNet)</h3>
6
6
 
7
- [![python](https://img.shields.io/badge/python-3.7%2B-blue)](https://github.com/intel/neural-compressor)
8
- [![version](https://img.shields.io/badge/release-2.3.2-green)](https://github.com/intel/neural-compressor/releases)
7
+ [![python](https://img.shields.io/badge/python-3.8%2B-blue)](https://github.com/intel/neural-compressor)
8
+ [![version](https://img.shields.io/badge/release-2.4-green)](https://github.com/intel/neural-compressor/releases)
9
9
  [![license](https://img.shields.io/badge/license-Apache%202-blue)](https://github.com/intel/neural-compressor/blob/master/LICENSE)
10
10
  [![coverage](https://img.shields.io/badge/coverage-85%25-green)](https://github.com/intel/neural-compressor)
11
11
  [![Downloads](https://static.pepy.tech/personalized-badge/neural-compressor?period=total&units=international_system&left_color=grey&right_color=green&left_text=downloads)](https://pepy.tech/project/neural-compressor)
@@ -21,9 +21,9 @@ In particular, the tool provides the key features, typical examples, and open co
21
21
 
22
22
  * Support a wide range of Intel hardware such as [Intel Xeon Scalable Processors](https://www.intel.com/content/www/us/en/products/details/processors/xeon/scalable.html), [Intel Xeon CPU Max Series](https://www.intel.com/content/www/us/en/products/details/processors/xeon/max-series.html), [Intel Data Center GPU Flex Series](https://www.intel.com/content/www/us/en/products/details/discrete-gpus/data-center-gpu/flex-series.html), and [Intel Data Center GPU Max Series](https://www.intel.com/content/www/us/en/products/details/discrete-gpus/data-center-gpu/max-series.html) with extensive testing; support AMD CPU, ARM CPU, and NVidia GPU through ONNX Runtime with limited testing
23
23
 
24
- * Validate popular LLMs such as LLama2, [LLama](examples/onnxrt/nlp/huggingface_model/text_generation/llama/quantization/ptq_static), [MPT](https://github.com/intel/intel-extension-for-transformers/blob/main/examples/huggingface/pytorch/text-generation/quantization/README.md), [Falcon](https://github.com/intel/intel-extension-for-transformers/blob/main/examples/huggingface/pytorch/language-modeling/quantization/README.md), [GPT-J](/examples/pytorch/nlp/huggingface_models/language-modeling/quantization/ptq_static/fx), [Bloom](/examples/pytorch/nlp/huggingface_models/language-modeling/quantization/ptq_static/ipex/smooth_quant), [OPT](/examples/pytorch/nlp/huggingface_models/language-modeling/quantization/ptq_static/ipex/smooth_quant), and more than 10,000 broad models such as [Stable Diffusion](/examples/pytorch/nlp/huggingface_models/text-to-image/quantization), [BERT-Large](/examples/pytorch/nlp/huggingface_models/text-classification/quantization/ptq_static/fx), and [ResNet50](/examples/pytorch/image_recognition/torchvision_models/quantization/ptq/cpu/fx) from popular model hubs such as [Hugging Face](https://huggingface.co/), [Torch Vision](https://pytorch.org/vision/stable/index.html), and [ONNX Model Zoo](https://github.com/onnx/models#models), by leveraging zero-code optimization solution [Neural Coder](/neural_coder#what-do-we-offer) and automatic [accuracy-driven](/docs/source/design.md#workflow) quantization strategies
24
+ * Validate popular LLMs such as [LLama2](/examples/pytorch/nlp/huggingface_models/language-modeling/quantization/llm), [Falcon](/examples/pytorch/nlp/huggingface_models/language-modeling/quantization/llm), [GPT-J](/examples/pytorch/nlp/huggingface_models/language-modeling/quantization/llm), [Bloom](/examples/pytorch/nlp/huggingface_models/language-modeling/quantization/llm), [OPT](/examples/pytorch/nlp/huggingface_models/language-modeling/quantization/llm), and more than 10,000 broad models such as [Stable Diffusion](/examples/pytorch/nlp/huggingface_models/text-to-image/quantization), [BERT-Large](/examples/pytorch/nlp/huggingface_models/text-classification/quantization/ptq_static/fx), and [ResNet50](/examples/pytorch/image_recognition/torchvision_models/quantization/ptq/cpu/fx) from popular model hubs such as [Hugging Face](https://huggingface.co/), [Torch Vision](https://pytorch.org/vision/stable/index.html), and [ONNX Model Zoo](https://github.com/onnx/models#models), by leveraging zero-code optimization solution [Neural Coder](/neural_coder#what-do-we-offer) and automatic [accuracy-driven](/docs/source/design.md#workflow) quantization strategies
25
25
 
26
- * Collaborate with cloud marketplace such as [Google Cloud Platform](https://console.cloud.google.com/marketplace/product/bitnami-launchpad/inc-tensorflow-intel?project=verdant-sensor-286207), [Amazon Web Services](https://aws.amazon.com/marketplace/pp/prodview-yjyh2xmggbmga#pdp-support), and [Azure](https://azuremarketplace.microsoft.com/en-us/marketplace/apps/bitnami.inc-tensorflow-intel), software platforms such as [Alibaba Cloud](https://www.intel.com/content/www/us/en/developer/articles/technical/quantize-ai-by-oneapi-analytics-on-alibaba-cloud.html), [Tencent TACO](https://new.qq.com/rain/a/20221202A00B9S00) and [Microsoft Olive](https://github.com/microsoft/Olive), and open AI ecosystem such as [Hugging Face](https://huggingface.co/blog/intel), [PyTorch](https://pytorch.org/tutorials/recipes/intel_neural_compressor_for_pytorch.html), [ONNX](https://github.com/onnx/models#models), [ONNX Runtime](https://github.com/microsoft/onnxruntime), and [Lightning AI](https://github.com/Lightning-AI/lightning/blob/master/docs/source-pytorch/advanced/post_training_quantization.rst)
26
+ * Collaborate with cloud marketplaces such as [Google Cloud Platform](https://console.cloud.google.com/marketplace/product/bitnami-launchpad/inc-tensorflow-intel?project=verdant-sensor-286207), [Amazon Web Services](https://aws.amazon.com/marketplace/pp/prodview-yjyh2xmggbmga#pdp-support), and [Azure](https://azuremarketplace.microsoft.com/en-us/marketplace/apps/bitnami.inc-tensorflow-intel), software platforms such as [Alibaba Cloud](https://www.intel.com/content/www/us/en/developer/articles/technical/quantize-ai-by-oneapi-analytics-on-alibaba-cloud.html), [Tencent TACO](https://new.qq.com/rain/a/20221202A00B9S00) and [Microsoft Olive](https://github.com/microsoft/Olive), and open AI ecosystem such as [Hugging Face](https://huggingface.co/blog/intel), [PyTorch](https://pytorch.org/tutorials/recipes/intel_neural_compressor_for_pytorch.html), [ONNX](https://github.com/onnx/models#models), [ONNX Runtime](https://github.com/microsoft/onnxruntime), and [Lightning AI](https://github.com/Lightning-AI/lightning/blob/master/docs/source-pytorch/advanced/post_training_quantization.rst)
27
27
 
28
28
  ## Installation
29
29
 
@@ -31,7 +31,8 @@ In particular, the tool provides the key features, typical examples, and open co
31
31
  ```Shell
32
32
  pip install neural-compressor
33
33
  ```
34
- > More installation methods can be found at [Installation Guide](./docs/source/installation_guide.md). Please check out our [FAQ](./docs/source/faq.md) for more details.
34
+ > **Note**:
35
+ > More installation methods can be found at [Installation Guide](https://github.com/intel/neural-compressor/blob/master/docs/source/installation_guide.md). Please check out our [FAQ](https://github.com/intel/neural-compressor/blob/master/docs/source/faq.md) for more details.
35
36
 
36
37
  ## Getting Started
37
38
  ### Quantization with Python API
@@ -121,7 +122,8 @@ q_model = fit(
121
122
  </tr>
122
123
  <tr>
123
124
  <td colspan="4" align="center"><a href="./docs/source/quantization_weight_only.md">Weight-Only Quantization (INT8/INT4/FP4/NF4) </td>
124
- <td colspan="4" align="center"><a href="https://github.com/intel/neural-compressor/blob/fp8_adaptor/docs/source/fp8.md">FP8 Quantization </td>
125
+ <td colspan="2" align="center"><a href="https://github.com/intel/neural-compressor/blob/fp8_adaptor/docs/source/fp8.md">FP8 Quantization </td>
126
+ <td colspan="2" align="center"><a href="./docs/source/quantization_layer_wise.md">Layer-Wise Quantization </td>
125
127
  </tr>
126
128
  </tbody>
127
129
  <thead>
@@ -137,18 +139,19 @@ q_model = fit(
137
139
  </tbody>
138
140
  </table>
139
141
 
140
- > More documentations can be found at [User Guide](./docs/source/user_guide.md).
142
+ > **Note**:
143
+ > More documentation can be found at [User Guide](https://github.com/intel/neural-compressor/blob/master/docs/source/user_guide.md).
141
144
 
142
145
  ## Selected Publications/Events
146
+ * Blog by Intel: [Effective Weight-Only Quantization for Large Language Models with Intel® Neural Compressor](https://community.intel.com/t5/Blogs/Tech-Innovation/Artificial-Intelligence-AI/Effective-Weight-Only-Quantization-for-Large-Language-Models/post/1529552) (Oct 2023)
143
147
  * EMNLP'2023 (Under Review): [TEQ: Trainable Equivalent Transformation for Quantization of LLMs](https://openreview.net/forum?id=iaI8xEINAf&referrer=%5BAuthor%20Console%5D) (Sep 2023)
144
148
  * arXiv: [Efficient Post-training Quantization with FP8 Formats](https://arxiv.org/abs/2309.14592) (Sep 2023)
145
149
  * arXiv: [Optimize Weight Rounding via Signed Gradient Descent for the Quantization of LLMs](https://arxiv.org/abs/2309.05516) (Sep 2023)
146
- * Post on Social Media: [ONNXCommunityMeetup2023: INT8 Quantization for Large Language Models with Intel Neural Compressor](https://www.youtube.com/watch?v=luYBWA1Q5pQ) (July 2023)
147
- * Blog by Intel: [Accelerate Llama 2 with Intel AI Hardware and Software Optimizations](https://www.intel.com/content/www/us/en/developer/articles/news/llama2.html) (July 2023)
148
150
  * NeurIPS'2022: [Fast Distilbert on CPUs](https://arxiv.org/abs/2211.07715) (Oct 2022)
149
151
  * NeurIPS'2022: [QuaLA-MiniLM: a Quantized Length Adaptive MiniLM](https://arxiv.org/abs/2210.17114) (Oct 2022)
150
152
 
151
- > View [Full Publication List](./docs/source/publication_list.md).
153
+ > **Note**:
154
+ > View [Full Publication List](https://github.com/intel/neural-compressor/blob/master/docs/source/publication_list.md).
152
155
 
153
156
  ## Additional Content
154
157
 
@@ -158,6 +161,7 @@ q_model = fit(
158
161
  * [Security Policy](SECURITY.md)
159
162
 
160
163
  ## Communication
161
- - [GitHub Issues](https://github.com/intel/neural-compressor/issues): mainly for bugs report, new feature request, question asking, etc.
164
+ - [GitHub Issues](https://github.com/intel/neural-compressor/issues): mainly for bug reports, new feature requests, question asking, etc.
162
165
  - [Email](mailto:inc.maintainers@intel.com): welcome to raise any interesting research ideas on model compression techniques by email for collaborations.
166
+ - [Discord Channel](https://discord.com/invite/Wxk3J3ZJkU): join the discord channel for more flexible technical discussion.
163
167
  - [WeChat group](/docs/source/imgs/wechat_group.jpg): scan the QR code to join the technical discussion.
@@ -0,0 +1,34 @@
1
+ # Copyright (c) 2023 Intel Corporation
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+
15
+ transformation:
16
+ location:
17
+ - ["insert_below_dataloader_definition_line", "insert_below_model_definition_line"]
18
+ content:
19
+ - |-
20
+ [+] from neural_compressor.config import PostTrainingQuantConfig
21
+ [+] from neural_compressor.quantization import fit
22
+ [+] MODEL_NAME = MODEL_NAME.to("xpu")
23
+ [+] conf = PostTrainingQuantConfig(backend='ipex', quant_level=1, device="xpu")
24
+ [+] MODEL_NAME = fit(model=MODEL_NAME, conf=conf, calib_dataloader=DATALOADER_NAME)
25
+ [+] MODEL_NAME.save("./quantized_model")
26
+ [+] MODEL_NAME.eval()
27
+ order:
28
+ - below:
29
+ above:
30
+ - pytorch_jit_script
31
+ - pytorch_jit_script_ofi
32
+ - pytorch_jit_trace
33
+ - pytorch_jit_trace_ofi
34
+ - pytorch_channels_last
@@ -56,7 +56,7 @@ def register_func_wrap_pair():
56
56
  if is_in_function and line_idx == func_end_line_idx:
57
57
  is_in_function = False
58
58
 
59
- # handle function's defnition line, to initiate a function
59
+ # handle function's definition line, to initiate a function
60
60
  if not is_in_function and "def " in line: # only deal with outermost def
61
61
  function_name = line[line.find("def") + 4 : line.find("(")]
62
62
 
@@ -118,6 +118,7 @@ def enable(
118
118
  "pytorch_inc_dynamic_quant",
119
119
  "pytorch_inc_static_quant_fx",
120
120
  "pytorch_inc_static_quant_ipex",
121
+ "pytorch_inc_static_quant_ipex_xpu",
121
122
  "pytorch_inc_bf16",
122
123
  "pytorch_inc_huggingface_optimum_static",
123
124
  "pytorch_inc_huggingface_optimum_dynamic",
@@ -210,6 +211,7 @@ def enable(
210
211
  or "pytorch_jit_trace_ofi" in features
211
212
  or "pytorch_inc_static_quant_fx" in features
212
213
  or "pytorch_inc_static_quant_ipex" in features
214
+ or "pytorch_inc_static_quant_ipex_xpu" in features
213
215
  ):
214
216
  features = ["pytorch_reclaim_inputs"] + features
215
217
 
@@ -312,6 +314,7 @@ def enable(
312
314
  "pytorch_inc_dynamic_quant",
313
315
  "pytorch_inc_static_quant_fx",
314
316
  "pytorch_inc_static_quant_ipex",
317
+ "pytorch_inc_static_quant_ipex_xpu",
315
318
  "pytorch_inc_huggingface_optimum_static",
316
319
  "pytorch_inc_huggingface_optimum_dynamic",
317
320
  "onnx_inc_static_quant_qlinear",
@@ -839,6 +842,7 @@ def superbench(
839
842
  ["pytorch_inc_dynamic_quant"],
840
843
  ["pytorch_inc_static_quant_fx"],
841
844
  ["pytorch_inc_static_quant_ipex"],
845
+ ["pytorch_inc_static_quant_ipex_xpu"],
842
846
  ["pytorch_inc_bf16"],
843
847
  ]
844
848
  standalones_pool = []
@@ -857,12 +861,14 @@ def superbench(
857
861
  "pytorch_ipex_bf16",
858
862
  "pytorch_inc_static_quant_fx",
859
863
  "pytorch_inc_static_quant_ipex",
864
+ "pytorch_inc_static_quant_ipex_xpu",
860
865
  "pytorch_inc_dynamic_quant",
861
866
  "pytorch_ipex_int8_static_quant",
862
867
  "pytorch_ipex_int8_dynamic_quant",
863
868
  ]
864
869
  # features that can be standalone (either use alone or use with "backend"):
865
870
  standalones_pool = [
871
+ "pytorch_ipex_xpu",
866
872
  "pytorch_mixed_precision_cpu",
867
873
  "pytorch_channels_last",
868
874
  ]
@@ -906,6 +912,8 @@ def superbench(
906
912
  continue
907
913
  if "pytorch_inc_static_quant_ipex" in features and "pytorch_mixed_precision_cpu" in features:
908
914
  continue
915
+ if "pytorch_inc_static_quant_ipex_xpu" in features and "pytorch_mixed_precision_cpu" in features:
916
+ continue
909
917
  if "pytorch_inc_dynamic_quant" in features and "pytorch_mixed_precision_cpu" in features:
910
918
  continue
911
919
 
@@ -960,6 +968,8 @@ def superbench(
960
968
  features_display = "Intel INT8 (Static)"
961
969
  elif features == ["pytorch_inc_static_quant_ipex"]:
962
970
  features_display = "Intel INT8 (IPEX)"
971
+ elif features == ["pytorch_inc_static_quant_ipex_xpu"]:
972
+ features_display = "Intel INT8 (IPEX XPU)"
963
973
  elif features == ["pytorch_inc_bf16"]:
964
974
  features_display = "Intel BF16"
965
975
  elif features == []:
@@ -1047,6 +1057,8 @@ def superbench(
1047
1057
  best_optimization_display = "Intel INT8 (Static)"
1048
1058
  elif list_optimization_set_top3[0] == ["pytorch_inc_static_quant_ipex"]:
1049
1059
  best_optimization_display = "Intel INT8 (IPEX)"
1060
+ elif list_optimization_set_top3[0] == ["pytorch_inc_static_quant_ipex_xpu"]:
1061
+ best_optimization_display = "Intel INT8 (IPEX XPU)"
1050
1062
  elif list_optimization_set_top3[0] == ["pytorch_inc_bf16"]:
1051
1063
  best_optimization_display = "Intel BF16"
1052
1064
  elif list_optimization_set_top3[0] == []:
@@ -57,6 +57,8 @@ class Launcher:
57
57
  args.opt = "pytorch_inc_static_quant_fx"
58
58
  if args.approach == "static_ipex":
59
59
  args.opt = "pytorch_inc_static_quant_ipex"
60
+ if args.approach == "static_ipex_xpu":
61
+ args.opt = "pytorch_inc_static_quant_ipex_xpu"
60
62
  if args.approach == "dynamic":
61
63
  args.opt = "pytorch_inc_dynamic_quant"
62
64
  if args.approach == "auto":
@@ -34,7 +34,7 @@ logger = logging.getLogger(__name__)
34
34
 
35
35
 
36
36
  class CPUinfo:
37
- """Get CPU inforamation, such as cores list and NUMA information."""
37
+ """Get CPU information, such as cores list and NUMA information."""
38
38
 
39
39
  def __init__(self):
40
40
  self.cpuinfo = []
@@ -460,7 +460,7 @@ class MultiInstanceLauncher(Launcher):
460
460
 
461
461
 
462
462
  class DistributedTrainingLauncher(Launcher):
463
- r"""Launcher for distributed traning with MPI launcher."""
463
+ r"""Launcher for distributed training with MPI launcher."""
464
464
 
465
465
  def get_mpi_pin_domain(self, nproc_per_node, ccl_worker_count, total_cores):
466
466
  """I_MPI_PIN_DOMAIN specify the cores used for every MPI process.
@@ -867,7 +867,7 @@ class KerasAdaptor(Adaptor):
867
867
  for i in range(len(list_len_dataloader) - 1):
868
868
  if list_len_dataloader[i] != list_len_dataloader[i + 1]:
869
869
  raise AttributeError(
870
- "The traning dataloader's iteration is"
870
+ "The training dataloader's iteration is"
871
871
  "different between processes, please reset dataloader's batch_size."
872
872
  )
873
873