compressed-tensors 0.12.3a20251007__tar.gz → 0.12.3a20251008__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (156)
  1. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/PKG-INFO +1 -1
  2. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/quantization/quant_args.py +10 -1
  3. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/version.py +1 -1
  4. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors.egg-info/PKG-INFO +1 -1
  5. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/test_utils/test_helpers.py +13 -7
  6. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.github/.gitkeep +0 -0
  7. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.github/actions/test/action.yml +0 -0
  8. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.github/scripts/step-status +0 -0
  9. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.github/workflows/build-test.yml +0 -0
  10. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.github/workflows/build.yml +0 -0
  11. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.github/workflows/post-release-nightly-build.yml +0 -0
  12. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.github/workflows/quality-check.yaml +0 -0
  13. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.github/workflows/report.yml +0 -0
  14. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.github/workflows/test-check.yaml +0 -0
  15. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.github/workflows/test.yml +0 -0
  16. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.github/workflows/trigger-all.yml +0 -0
  17. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.github/workflows/upload.yml +0 -0
  18. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.gitignore +0 -0
  19. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/LICENSE +0 -0
  20. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/Makefile +0 -0
  21. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/README.md +0 -0
  22. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/examples/bit_packing/ex_quantize_and_pack.py +0 -0
  23. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/examples/bit_packing/int4_config.json +0 -0
  24. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/examples/bitmask_compression.ipynb +0 -0
  25. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/examples/llama_1.1b/ex_config_quantization.py +0 -0
  26. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/examples/llama_1.1b/ex_llmcompressor_quantization.py +0 -0
  27. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/examples/llama_1.1b/example_quant_config.json +0 -0
  28. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/examples/llama_1.1b/example_quant_recipe.yaml +0 -0
  29. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/examples/quantize_and_pack_int4.ipynb +0 -0
  30. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/pyproject.toml +0 -0
  31. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/setup.cfg +0 -0
  32. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/setup.py +0 -0
  33. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/__init__.py +0 -0
  34. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/README.md +0 -0
  35. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/__init__.py +0 -0
  36. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/base.py +0 -0
  37. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/__init__.py +0 -0
  38. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/base.py +0 -0
  39. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/helpers.py +0 -0
  40. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/model_compressors/__init__.py +0 -0
  41. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/model_compressors/model_compressor.py +0 -0
  42. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/quantized_compressors/__init__.py +0 -0
  43. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/quantized_compressors/base.py +0 -0
  44. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/quantized_compressors/naive_quantized.py +0 -0
  45. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/quantized_compressors/nvfp4_quantized.py +0 -0
  46. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/quantized_compressors/pack_quantized.py +0 -0
  47. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/sparse_compressors/__init__.py +0 -0
  48. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/sparse_compressors/base.py +0 -0
  49. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/sparse_compressors/dense.py +0 -0
  50. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/sparse_compressors/sparse_24_bitmask.py +0 -0
  51. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/sparse_compressors/sparse_bitmask.py +0 -0
  52. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/sparse_quantized_compressors/__init__.py +0 -0
  53. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/sparse_quantized_compressors/marlin_24.py +0 -0
  54. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/config/__init__.py +0 -0
  55. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/config/base.py +0 -0
  56. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/config/dense.py +0 -0
  57. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/config/format.py +0 -0
  58. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/config/sparse_24_bitmask.py +0 -0
  59. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/config/sparse_bitmask.py +0 -0
  60. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/linear/__init__.py +0 -0
  61. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/linear/compressed_linear.py +0 -0
  62. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/logger.py +0 -0
  63. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/quantization/__init__.py +0 -0
  64. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/quantization/lifecycle/__init__.py +0 -0
  65. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/quantization/lifecycle/apply.py +0 -0
  66. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/quantization/lifecycle/compressed.py +0 -0
  67. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/quantization/lifecycle/forward.py +0 -0
  68. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/quantization/lifecycle/helpers.py +0 -0
  69. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/quantization/lifecycle/initialize.py +0 -0
  70. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/quantization/quant_config.py +0 -0
  71. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/quantization/quant_metadata.py +0 -0
  72. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/quantization/quant_scheme.py +0 -0
  73. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/quantization/utils/__init__.py +0 -0
  74. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/quantization/utils/helpers.py +0 -0
  75. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/registry/__init__.py +0 -0
  76. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/registry/registry.py +0 -0
  77. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/__init__.py +0 -0
  78. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/apply.py +0 -0
  79. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/factory/__init__.py +0 -0
  80. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/factory/base.py +0 -0
  81. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/factory/hadamard.py +0 -0
  82. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/factory/matrix_multiply.py +0 -0
  83. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/factory/random_hadamard.py +0 -0
  84. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/transform_args.py +0 -0
  85. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/transform_config.py +0 -0
  86. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/transform_scheme.py +0 -0
  87. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/utils/__init__.py +0 -0
  88. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/utils/hadamard.py +0 -0
  89. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/utils/hadamards.safetensors +0 -0
  90. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/utils/matrix.py +0 -0
  91. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/utils/__init__.py +0 -0
  92. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/utils/helpers.py +0 -0
  93. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/utils/internal.py +0 -0
  94. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/utils/match.py +0 -0
  95. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/utils/offload.py +0 -0
  96. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/utils/permutations_24.py +0 -0
  97. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/utils/safetensors_load.py +0 -0
  98. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/utils/semi_structured_conversions.py +0 -0
  99. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/utils/type.py +0 -0
  100. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors.egg-info/SOURCES.txt +0 -0
  101. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors.egg-info/dependency_links.txt +0 -0
  102. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors.egg-info/requires.txt +0 -0
  103. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors.egg-info/top_level.txt +0 -0
  104. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/__init__.py +0 -0
  105. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/conftest.py +0 -0
  106. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_compressors/__init__.py +0 -0
  107. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_compressors/model_compressors/__init__.py +0 -0
  108. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_compressors/model_compressors/test_model_compressor.py +0 -0
  109. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_compressors/quantized_compressors/__init__.py +0 -0
  110. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_compressors/quantized_compressors/test_fp8_quant.py +0 -0
  111. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_compressors/quantized_compressors/test_int_quant.py +0 -0
  112. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_compressors/quantized_compressors/test_nvfp4_quant.py +0 -0
  113. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_compressors/quantized_compressors/test_pack_quant.py +0 -0
  114. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_compressors/sparse_compressors/__init__.py +0 -0
  115. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_compressors/sparse_compressors/test_bitmask.py +0 -0
  116. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_compressors/sparse_compressors/test_sparse_24_bitmask.py +0 -0
  117. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_compressors/sparse_quantized_compressors/__init__.py +0 -0
  118. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_compressors/sparse_quantized_compressors/test_marlin_24.py +0 -0
  119. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_configs/__init__.py +0 -0
  120. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_configs/test_base.py +0 -0
  121. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_configs/test_infer_quant.py +0 -0
  122. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_examples/test_bitmask_compression_ipynb.py +0 -0
  123. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_linear/__init__.py +0 -0
  124. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_linear/test_compressed_linear.py +0 -0
  125. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/__init__.py +0 -0
  126. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/lifecycle/__init__.py +0 -0
  127. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/lifecycle/conftest.py +0 -0
  128. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/lifecycle/test_apply.py +0 -0
  129. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/lifecycle/test_dynamic_lifecycle.py +0 -0
  130. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/lifecycle/test_enabled.py +0 -0
  131. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/lifecycle/test_forward.py +0 -0
  132. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/lifecycle/test_initialize.py +0 -0
  133. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/lifecycle/test_lifecycle.py +0 -0
  134. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/test_configs/__init__.py +0 -0
  135. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/test_configs/test_bit_depths.py +0 -0
  136. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/test_configs/test_strategies.py +0 -0
  137. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/test_quant_args.py +0 -0
  138. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/test_quant_config.py +0 -0
  139. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/test_quant_scheme.py +0 -0
  140. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_registry.py +0 -0
  141. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_transform/conftest.py +0 -0
  142. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_transform/factory/test_correctness.py +0 -0
  143. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_transform/factory/test_memory.py +0 -0
  144. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_transform/factory/test_serialization.py +0 -0
  145. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_transform/test_transform_args.py +0 -0
  146. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_transform/test_transform_config.py +0 -0
  147. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_transform/test_transform_scheme.py +0 -0
  148. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_transform/utils/test_hadamard.py +0 -0
  149. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_utils/__init__.py +0 -0
  150. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_utils/test_helpers.py +0 -0
  151. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_utils/test_match.py +0 -0
  152. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_utils/test_offload.py +0 -0
  153. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_utils/test_safetensors_load.py +0 -0
  154. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_utils/test_type.py +0 -0
  155. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/testing_utils.py +0 -0
  156. {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/utils/copyright.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: compressed-tensors
3
- Version: 0.12.3a20251007
3
+ Version: 0.12.3a20251008
4
4
  Summary: Library for utilization of compressed safetensors of neural network models
5
5
  Home-page: https://github.com/neuralmagic/compressed-tensors
6
6
  Author: Neuralmagic, Inc.
@@ -259,6 +259,7 @@ class QuantizationArgs(BaseModel, use_enum_values=True):
259
259
  # extract user-passed values from dictionary
260
260
  strategy = model.strategy
261
261
  group_size = model.group_size
262
+ block_structure = model.block_structure
262
263
  actorder = model.actorder
263
264
  dynamic = model.dynamic
264
265
  observer = model.observer
@@ -277,7 +278,7 @@ class QuantizationArgs(BaseModel, use_enum_values=True):
277
278
  "strategy='group' and group_size = -1 for 'channel'"
278
279
  )
279
280
 
280
- # validate strategy and group
281
+ # validate group strategy
281
282
  if strategy == QuantizationStrategy.GROUP:
282
283
  if group_size is None or group_size <= 0:
283
284
  raise ValueError(
@@ -292,6 +293,14 @@ class QuantizationArgs(BaseModel, use_enum_values=True):
292
293
  ):
293
294
  raise ValueError("group_size requires strategy to be set to 'group'")
294
295
 
296
+ # validate block strategy
297
+ has_block_strategy = strategy == QuantizationStrategy.BLOCK
298
+ has_block_structure = block_structure is not None
299
+ if has_block_strategy and not has_block_structure:
300
+ raise ValueError(f"Block strategy requires block structure\n{model}")
301
+ if has_block_structure and not has_block_strategy:
302
+ raise ValueError(f"Block structure requires block strategy\n{model}")
303
+
295
304
  # validate activation ordering and strategy
296
305
  if actorder is not None and strategy != QuantizationStrategy.GROUP:
297
306
  raise ValueError(
@@ -17,5 +17,5 @@ __version__: str
17
17
  __version_tuple__: VERSION_TUPLE
18
18
  version_tuple: VERSION_TUPLE
19
19
 
20
- __version__ = version = '0.12.3.a20251007'
20
+ __version__ = version = '0.12.3.a20251008'
21
21
  __version_tuple__ = version_tuple = (0, 12, 3)
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: compressed-tensors
3
- Version: 0.12.3a20251007
3
+ Version: 0.12.3a20251008
4
4
  Summary: Library for utilization of compressed safetensors of neural network models
5
5
  Home-page: https://github.com/neuralmagic/compressed-tensors
6
6
  Author: Neuralmagic, Inc.
@@ -32,36 +32,42 @@ from compressed_tensors.quantization.utils import (
32
32
  [
33
33
  (
34
34
  False,
35
- QuantizationStrategy.TENSOR,
35
+ "tensor",
36
36
  torch.Size(
37
37
  [
38
38
  1,
39
39
  ]
40
40
  ),
41
41
  ),
42
- (True, QuantizationStrategy.CHANNEL, torch.Size([1, 1])),
43
- (True, QuantizationStrategy.GROUP, torch.Size([1, 1])),
42
+ (True, "channel", torch.Size([1, 1])),
43
+ (True, "group", torch.Size([1, 1])),
44
44
  (
45
45
  False,
46
- QuantizationStrategy.BLOCK,
46
+ "block",
47
47
  torch.Size(
48
48
  [
49
49
  1,
50
50
  ]
51
51
  ),
52
52
  ),
53
- (True, QuantizationStrategy.TOKEN, torch.Size([1, 1])),
53
+ (True, "token", torch.Size([1, 1])),
54
54
  ],
55
55
  )
56
56
  def test_calculate_qparams(keepdims, strategy, exp_shape):
57
- value = torch.randn(14, 5)
57
+ value = torch.empty(5, 6)
58
58
  min_val = torch.amin(value, dim=tuple(), keepdims=keepdims)
59
59
  max_val = torch.amax(value, dim=tuple(), keepdims=keepdims)
60
60
 
61
61
  if strategy == QuantizationStrategy.GROUP:
62
62
  args = QuantizationArgs(strategy=strategy, group_size=2)
63
+ elif strategy == QuantizationStrategy.BLOCK:
64
+ args = QuantizationArgs(strategy=strategy, block_structure=[1, 3])
63
65
  else:
64
- args = QuantizationArgs(strategy=strategy)
66
+ args = QuantizationArgs(
67
+ strategy=strategy,
68
+ group_size=(2 if strategy == "group" else None),
69
+ block_structure=([1, 3] if strategy == "block" else None),
70
+ )
65
71
  scale, zp = calculate_qparams(min_val, max_val, args)
66
72
  assert scale.shape == exp_shape
67
73
  assert zp.shape == exp_shape