compressed-tensors 0.10.3a20250728__tar.gz → 0.10.3a20250731__tar.gz

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.
Files changed (149)
  1. {compressed_tensors-0.10.3a20250728/src/compressed_tensors.egg-info → compressed_tensors-0.10.3a20250731}/PKG-INFO +1 -1
  2. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/compressors/quantized_compressors/nvfp4_quantized.py +21 -0
  3. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/quantization/lifecycle/forward.py +7 -19
  4. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/quantization/utils/helpers.py +7 -11
  5. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/version.py +1 -1
  6. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731/src/compressed_tensors.egg-info}/PKG-INFO +1 -1
  7. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_quantization/test_utils/test_helpers.py +1 -1
  8. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/.github/.gitkeep +0 -0
  9. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/.github/actions/test/action.yml +0 -0
  10. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/.github/scripts/step-status +0 -0
  11. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/.github/workflows/build-test.yml +0 -0
  12. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/.github/workflows/build.yml +0 -0
  13. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/.github/workflows/report.yml +0 -0
  14. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/.github/workflows/test-check.yaml +0 -0
  15. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/.github/workflows/test.yml +0 -0
  16. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/.github/workflows/trigger-all.yml +0 -0
  17. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/.github/workflows/upload.yml +0 -0
  18. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/.gitignore +0 -0
  19. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/LICENSE +0 -0
  20. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/Makefile +0 -0
  21. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/README.md +0 -0
  22. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/examples/bit_packing/ex_quantize_and_pack.py +0 -0
  23. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/examples/bit_packing/int4_config.json +0 -0
  24. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/examples/bitmask_compression.ipynb +0 -0
  25. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/examples/llama_1.1b/ex_config_quantization.py +0 -0
  26. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/examples/llama_1.1b/ex_llmcompressor_quantization.py +0 -0
  27. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/examples/llama_1.1b/example_quant_config.json +0 -0
  28. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/examples/llama_1.1b/example_quant_recipe.yaml +0 -0
  29. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/examples/quantize_and_pack_int4.ipynb +0 -0
  30. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/pyproject.toml +0 -0
  31. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/setup.cfg +0 -0
  32. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/setup.py +0 -0
  33. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/__init__.py +0 -0
  34. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/README.md +0 -0
  35. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/__init__.py +0 -0
  36. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/base.py +0 -0
  37. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/compressors/__init__.py +0 -0
  38. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/compressors/base.py +0 -0
  39. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/compressors/helpers.py +0 -0
  40. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/compressors/model_compressors/__init__.py +0 -0
  41. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/compressors/model_compressors/model_compressor.py +0 -0
  42. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/compressors/quantized_compressors/__init__.py +0 -0
  43. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/compressors/quantized_compressors/base.py +0 -0
  44. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/compressors/quantized_compressors/naive_quantized.py +0 -0
  45. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/compressors/quantized_compressors/pack_quantized.py +0 -0
  46. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/compressors/sparse_compressors/__init__.py +0 -0
  47. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/compressors/sparse_compressors/base.py +0 -0
  48. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/compressors/sparse_compressors/dense.py +0 -0
  49. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/compressors/sparse_compressors/sparse_24_bitmask.py +0 -0
  50. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/compressors/sparse_compressors/sparse_bitmask.py +0 -0
  51. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/compressors/sparse_quantized_compressors/__init__.py +0 -0
  52. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/compressors/sparse_quantized_compressors/marlin_24.py +0 -0
  53. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/config/__init__.py +0 -0
  54. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/config/base.py +0 -0
  55. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/config/dense.py +0 -0
  56. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/config/sparse_24_bitmask.py +0 -0
  57. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/config/sparse_bitmask.py +0 -0
  58. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/linear/__init__.py +0 -0
  59. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/linear/compressed_linear.py +0 -0
  60. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/quantization/__init__.py +0 -0
  61. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/quantization/lifecycle/__init__.py +0 -0
  62. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/quantization/lifecycle/apply.py +0 -0
  63. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/quantization/lifecycle/compressed.py +0 -0
  64. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/quantization/lifecycle/helpers.py +0 -0
  65. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/quantization/lifecycle/initialize.py +0 -0
  66. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/quantization/quant_args.py +0 -0
  67. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/quantization/quant_config.py +0 -0
  68. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/quantization/quant_scheme.py +0 -0
  69. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/quantization/utils/__init__.py +0 -0
  70. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/registry/__init__.py +0 -0
  71. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/registry/registry.py +0 -0
  72. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/transform/__init__.py +0 -0
  73. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/transform/apply.py +0 -0
  74. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/transform/factory/__init__.py +0 -0
  75. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/transform/factory/base.py +0 -0
  76. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/transform/factory/hadamard.py +0 -0
  77. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/transform/factory/matrix_multiply.py +0 -0
  78. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/transform/factory/random_hadamard.py +0 -0
  79. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/transform/transform_args.py +0 -0
  80. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/transform/transform_config.py +0 -0
  81. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/transform/transform_scheme.py +0 -0
  82. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/transform/utils/__init__.py +0 -0
  83. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/transform/utils/hadamard.py +0 -0
  84. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/transform/utils/hadamards.safetensors +0 -0
  85. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/transform/utils/matrix.py +0 -0
  86. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/utils/__init__.py +0 -0
  87. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/utils/helpers.py +0 -0
  88. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/utils/internal.py +0 -0
  89. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/utils/match.py +0 -0
  90. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/utils/offload.py +0 -0
  91. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/utils/permutations_24.py +0 -0
  92. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/utils/permute.py +0 -0
  93. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/utils/safetensors_load.py +0 -0
  94. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors/utils/semi_structured_conversions.py +0 -0
  95. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors.egg-info/SOURCES.txt +0 -0
  96. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors.egg-info/dependency_links.txt +0 -0
  97. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors.egg-info/requires.txt +0 -0
  98. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/src/compressed_tensors.egg-info/top_level.txt +0 -0
  99. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/__init__.py +0 -0
  100. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/conftest.py +0 -0
  101. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_compressors/__init__.py +0 -0
  102. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_compressors/model_compressors/__init__.py +0 -0
  103. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_compressors/model_compressors/test_model_compressor.py +0 -0
  104. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_compressors/quantized_compressors/__init__.py +0 -0
  105. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_compressors/quantized_compressors/test_fp8_quant.py +0 -0
  106. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_compressors/quantized_compressors/test_int_quant.py +0 -0
  107. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_compressors/quantized_compressors/test_nvfp4_quant.py +0 -0
  108. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_compressors/quantized_compressors/test_pack_quant.py +0 -0
  109. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_compressors/sparse_compressors/__init__.py +0 -0
  110. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_compressors/sparse_compressors/test_bitmask.py +0 -0
  111. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_compressors/sparse_compressors/test_sparse_24_bitmask.py +0 -0
  112. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_compressors/sparse_quantized_compressors/__init__.py +0 -0
  113. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_compressors/sparse_quantized_compressors/test_marlin_24.py +0 -0
  114. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_configs/__init__.py +0 -0
  115. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_configs/test_base.py +0 -0
  116. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_examples/test_bitmask_compression_ipynb.py +0 -0
  117. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_linear/__init__.py +0 -0
  118. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_linear/test_compressed_linear.py +0 -0
  119. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_quantization/__init__.py +0 -0
  120. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_quantization/lifecycle/__init__.py +0 -0
  121. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_quantization/lifecycle/conftest.py +0 -0
  122. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_quantization/lifecycle/test_apply.py +0 -0
  123. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_quantization/lifecycle/test_dynamic_lifecycle.py +0 -0
  124. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_quantization/lifecycle/test_enabled.py +0 -0
  125. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_quantization/lifecycle/test_forward.py +0 -0
  126. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_quantization/lifecycle/test_helpers.py +0 -0
  127. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_quantization/lifecycle/test_initialize.py +0 -0
  128. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_quantization/lifecycle/test_lifecycle.py +0 -0
  129. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_quantization/test_configs/__init__.py +0 -0
  130. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_quantization/test_configs/test_bit_depths.py +0 -0
  131. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_quantization/test_configs/test_strategies.py +0 -0
  132. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_quantization/test_quant_args.py +0 -0
  133. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_quantization/test_quant_config.py +0 -0
  134. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_quantization/test_quant_scheme.py +0 -0
  135. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_registry.py +0 -0
  136. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_transform/conftest.py +0 -0
  137. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_transform/factory/test_correctness.py +0 -0
  138. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_transform/factory/test_memory.py +0 -0
  139. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_transform/test_transform_args.py +0 -0
  140. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_transform/test_transform_config.py +0 -0
  141. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_transform/test_transform_scheme.py +0 -0
  142. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_transform/utils/test_hadamard.py +0 -0
  143. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_utils/__init__.py +0 -0
  144. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_utils/test_helpers.py +0 -0
  145. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_utils/test_match.py +0 -0
  146. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_utils/test_offload.py +0 -0
  147. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/test_utils/test_safetensors_load.py +0 -0
  148. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/tests/testing_utils.py +0 -0
  149. {compressed_tensors-0.10.3a20250728 → compressed_tensors-0.10.3a20250731}/utils/copyright.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: compressed-tensors
3
- Version: 0.10.3a20250728
3
+ Version: 0.10.3a20250731
4
4
  Summary: Library for utilization of compressed safetensors of neural network models
5
5
  Home-page: https://github.com/neuralmagic/compressed-tensors
6
6
  Author: Neuralmagic, Inc.
@@ -61,6 +61,27 @@ class NVFP4PackedCompressor(BaseQuantizationCompressor):
61
61
  "weight_global_scale",
62
62
  )
63
63
 
64
+ def compression_param_info(
65
+ self,
66
+ weight_shape: torch.Size,
67
+ quantization_args: Optional[QuantizationArgs] = None,
68
+ ) -> Dict[str, Tuple[torch.Size, torch.dtype]]:
69
+ """
70
+ Creates a dictionary of expected shapes and dtypes for each compression
71
+ parameter used by the compressor
72
+
73
+ :param weight_shape: uncompressed weight shape
74
+ :param quantization_args: quantization parameters for the weight
75
+ :return: dictionary mapping compressed parameter names to shape and dtype
76
+ """
77
+ output = {
78
+ "weight_packed": (
79
+ torch.Size((weight_shape[0], weight_shape[1] // 2)),
80
+ torch.uint8,
81
+ ),
82
+ }
83
+ return output
84
+
64
85
  def compress_weight(
65
86
  self,
66
87
  weight: Tensor,
@@ -257,13 +257,10 @@ def _process_quantization(
257
257
  QuantizationStrategy.GROUP,
258
258
  QuantizationStrategy.TENSOR_GROUP,
259
259
  ):
260
- n_dims = x.shape
261
- if len(n_dims) > 2:
262
- x = x.squeeze(0)
263
260
 
264
261
  output_dtype = dtype if dtype is not None else x.dtype
265
262
  output = torch.zeros_like(x).to(output_dtype)
266
- columns = output.shape[1]
263
+ columns = output.shape[-1]
267
264
 
268
265
  # TODO: make validation step for inputs
269
266
 
@@ -293,14 +290,12 @@ def _process_quantization(
293
290
  perm = torch.argsort(g_idx)
294
291
  x = safe_permute(x, perm, dim=1)
295
292
 
296
- x = torch.reshape(
297
- x,
298
- (
299
- x.shape[0],
300
- ceil(x.shape[1] / group_size),
301
- group_size,
302
- ),
293
+ # Maintain all dimensions apart from the last dim, which is divided by the group_size
294
+ reshaped_dims = (
295
+ ceil(x.shape[-1] / group_size),
296
+ group_size,
303
297
  )
298
+ x = x.unflatten(-1, reshaped_dims)
304
299
 
305
300
  if do_quantize:
306
301
  output = _quantize(
@@ -323,19 +318,12 @@ def _process_quantization(
323
318
  global_scale=global_scale,
324
319
  )
325
320
 
326
- output = torch.reshape(
327
- output,
328
- (output.shape[0], output.shape[1] * output.shape[2]),
329
- )
330
-
321
+ output = output.flatten(start_dim=-2)
331
322
  output = output.to(output_dtype)
332
323
 
333
324
  if not is_column_order:
334
325
  output = safe_permute(output, torch.argsort(perm), dim=1)
335
326
 
336
- if len(n_dims) > 2:
337
- output = output.unsqueeze(0)
338
-
339
327
  else: # covers channel, token and tensor strategies
340
328
  if do_quantize:
341
329
  output = _quantize(
@@ -175,20 +175,16 @@ def compute_dynamic_scales_and_zp(
175
175
  QuantizationStrategy.TENSOR_GROUP,
176
176
  QuantizationStrategy.GROUP,
177
177
  ):
178
- if len(value.shape) > 2:
179
- value = value.squeeze(0)
180
178
 
181
- dim = {0, 1}
182
- reduce_dims = tuple(idx for idx in range(3) if idx not in dim)
179
+ reduce_dims = -1
183
180
  keep_dims = False
184
- value = torch.reshape(
185
- value,
186
- (
187
- value.shape[0],
188
- math.ceil(value.shape[1] / args.group_size),
189
- args.group_size,
190
- ),
181
+
182
+ reshaped_dims = (
183
+ math.ceil(value.shape[-1] / args.group_size),
184
+ args.group_size,
191
185
  )
186
+ value = value.unflatten(-1, reshaped_dims)
187
+
192
188
  else:
193
189
  supported_strategies = (
194
190
  QuantizationStrategy.TOKEN,
@@ -17,5 +17,5 @@ __version__: str
17
17
  __version_tuple__: VERSION_TUPLE
18
18
  version_tuple: VERSION_TUPLE
19
19
 
20
- __version__ = version = '0.10.3.a20250728'
20
+ __version__ = version = '0.10.3.a20250731'
21
21
  __version_tuple__ = version_tuple = (0, 10, 3)
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: compressed-tensors
3
- Version: 0.10.3a20250728
3
+ Version: 0.10.3a20250731
4
4
  Summary: Library for utilization of compressed safetensors of neural network models
5
5
  Home-page: https://github.com/neuralmagic/compressed-tensors
6
6
  Author: Neuralmagic, Inc.
@@ -83,7 +83,7 @@ def test_fused_global_scales():
83
83
  "shape,group_size,exp_shape",
84
84
  [
85
85
  # Only batch size =1 is supported for dynamic GROUP quantization
86
- ((1, 4, 8), 4, torch.Size([4, 2])),
86
+ ((1, 4, 8), 4, torch.Size([1, 4, 2])),
87
87
  ],
88
88
  )
89
89
  def test_compute_dynamic_scales_and_zp_group(shape, group_size, exp_shape):