compressed-tensors 0.12.3a20251007__tar.gz → 0.12.3a20251008__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/PKG-INFO +1 -1
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/quantization/quant_args.py +10 -1
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/version.py +1 -1
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors.egg-info/PKG-INFO +1 -1
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/test_utils/test_helpers.py +13 -7
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.github/.gitkeep +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.github/actions/test/action.yml +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.github/scripts/step-status +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.github/workflows/build-test.yml +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.github/workflows/build.yml +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.github/workflows/post-release-nightly-build.yml +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.github/workflows/quality-check.yaml +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.github/workflows/report.yml +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.github/workflows/test-check.yaml +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.github/workflows/test.yml +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.github/workflows/trigger-all.yml +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.github/workflows/upload.yml +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.gitignore +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/LICENSE +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/Makefile +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/README.md +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/examples/bit_packing/ex_quantize_and_pack.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/examples/bit_packing/int4_config.json +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/examples/bitmask_compression.ipynb +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/examples/llama_1.1b/ex_config_quantization.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/examples/llama_1.1b/ex_llmcompressor_quantization.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/examples/llama_1.1b/example_quant_config.json +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/examples/llama_1.1b/example_quant_recipe.yaml +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/examples/quantize_and_pack_int4.ipynb +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/pyproject.toml +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/setup.cfg +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/setup.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/README.md +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/base.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/base.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/helpers.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/model_compressors/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/model_compressors/model_compressor.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/quantized_compressors/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/quantized_compressors/base.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/quantized_compressors/naive_quantized.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/quantized_compressors/nvfp4_quantized.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/quantized_compressors/pack_quantized.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/sparse_compressors/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/sparse_compressors/base.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/sparse_compressors/dense.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/sparse_compressors/sparse_24_bitmask.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/sparse_compressors/sparse_bitmask.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/sparse_quantized_compressors/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/compressors/sparse_quantized_compressors/marlin_24.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/config/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/config/base.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/config/dense.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/config/format.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/config/sparse_24_bitmask.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/config/sparse_bitmask.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/linear/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/linear/compressed_linear.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/logger.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/quantization/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/quantization/lifecycle/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/quantization/lifecycle/apply.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/quantization/lifecycle/compressed.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/quantization/lifecycle/forward.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/quantization/lifecycle/helpers.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/quantization/lifecycle/initialize.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/quantization/quant_config.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/quantization/quant_metadata.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/quantization/quant_scheme.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/quantization/utils/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/quantization/utils/helpers.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/registry/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/registry/registry.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/apply.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/factory/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/factory/base.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/factory/hadamard.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/factory/matrix_multiply.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/factory/random_hadamard.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/transform_args.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/transform_config.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/transform_scheme.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/utils/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/utils/hadamard.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/utils/hadamards.safetensors +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/transform/utils/matrix.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/utils/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/utils/helpers.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/utils/internal.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/utils/match.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/utils/offload.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/utils/permutations_24.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/utils/safetensors_load.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/utils/semi_structured_conversions.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors/utils/type.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors.egg-info/SOURCES.txt +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors.egg-info/dependency_links.txt +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors.egg-info/requires.txt +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/src/compressed_tensors.egg-info/top_level.txt +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/conftest.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_compressors/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_compressors/model_compressors/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_compressors/model_compressors/test_model_compressor.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_compressors/quantized_compressors/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_compressors/quantized_compressors/test_fp8_quant.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_compressors/quantized_compressors/test_int_quant.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_compressors/quantized_compressors/test_nvfp4_quant.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_compressors/quantized_compressors/test_pack_quant.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_compressors/sparse_compressors/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_compressors/sparse_compressors/test_bitmask.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_compressors/sparse_compressors/test_sparse_24_bitmask.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_compressors/sparse_quantized_compressors/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_compressors/sparse_quantized_compressors/test_marlin_24.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_configs/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_configs/test_base.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_configs/test_infer_quant.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_examples/test_bitmask_compression_ipynb.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_linear/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_linear/test_compressed_linear.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/lifecycle/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/lifecycle/conftest.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/lifecycle/test_apply.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/lifecycle/test_dynamic_lifecycle.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/lifecycle/test_enabled.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/lifecycle/test_forward.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/lifecycle/test_initialize.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/lifecycle/test_lifecycle.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/test_configs/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/test_configs/test_bit_depths.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/test_configs/test_strategies.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/test_quant_args.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/test_quant_config.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_quantization/test_quant_scheme.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_registry.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_transform/conftest.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_transform/factory/test_correctness.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_transform/factory/test_memory.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_transform/factory/test_serialization.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_transform/test_transform_args.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_transform/test_transform_config.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_transform/test_transform_scheme.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_transform/utils/test_hadamard.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_utils/__init__.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_utils/test_helpers.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_utils/test_match.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_utils/test_offload.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_utils/test_safetensors_load.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_utils/test_type.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/testing_utils.py +0 -0
- {compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/utils/copyright.py +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: compressed-tensors
|
|
3
|
-
Version: 0.12.3a20251007
|
|
3
|
+
Version: 0.12.3a20251008
|
|
4
4
|
Summary: Library for utilization of compressed safetensors of neural network models
|
|
5
5
|
Home-page: https://github.com/neuralmagic/compressed-tensors
|
|
6
6
|
Author: Neuralmagic, Inc.
|
|
@@ -259,6 +259,7 @@ class QuantizationArgs(BaseModel, use_enum_values=True):
|
|
|
259
259
|
# extract user-passed values from dictionary
|
|
260
260
|
strategy = model.strategy
|
|
261
261
|
group_size = model.group_size
|
|
262
|
+
block_structure = model.block_structure
|
|
262
263
|
actorder = model.actorder
|
|
263
264
|
dynamic = model.dynamic
|
|
264
265
|
observer = model.observer
|
|
@@ -277,7 +278,7 @@ class QuantizationArgs(BaseModel, use_enum_values=True):
|
|
|
277
278
|
"strategy='group' and group_size = -1 for 'channel'"
|
|
278
279
|
)
|
|
279
280
|
|
|
280
|
-
# validate strategy
|
|
281
|
+
# validate group strategy
|
|
281
282
|
if strategy == QuantizationStrategy.GROUP:
|
|
282
283
|
if group_size is None or group_size <= 0:
|
|
283
284
|
raise ValueError(
|
|
@@ -292,6 +293,14 @@ class QuantizationArgs(BaseModel, use_enum_values=True):
|
|
|
292
293
|
):
|
|
293
294
|
raise ValueError("group_size requires strategy to be set to 'group'")
|
|
294
295
|
|
|
296
|
+
# validate block strategy
|
|
297
|
+
has_block_strategy = strategy == QuantizationStrategy.BLOCK
|
|
298
|
+
has_block_structure = block_structure is not None
|
|
299
|
+
if has_block_strategy and not has_block_structure:
|
|
300
|
+
raise ValueError(f"Block strategy requires block structure\n{model}")
|
|
301
|
+
if has_block_structure and not has_block_strategy:
|
|
302
|
+
raise ValueError(f"Block structure requires block strategy\n{model}")
|
|
303
|
+
|
|
295
304
|
# validate activation ordering and strategy
|
|
296
305
|
if actorder is not None and strategy != QuantizationStrategy.GROUP:
|
|
297
306
|
raise ValueError(
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: compressed-tensors
|
|
3
|
-
Version: 0.12.3a20251007
|
|
3
|
+
Version: 0.12.3a20251008
|
|
4
4
|
Summary: Library for utilization of compressed safetensors of neural network models
|
|
5
5
|
Home-page: https://github.com/neuralmagic/compressed-tensors
|
|
6
6
|
Author: Neuralmagic, Inc.
|
|
@@ -32,36 +32,42 @@ from compressed_tensors.quantization.utils import (
|
|
|
32
32
|
[
|
|
33
33
|
(
|
|
34
34
|
False,
|
|
35
|
-
|
|
35
|
+
"tensor",
|
|
36
36
|
torch.Size(
|
|
37
37
|
[
|
|
38
38
|
1,
|
|
39
39
|
]
|
|
40
40
|
),
|
|
41
41
|
),
|
|
42
|
-
(True,
|
|
43
|
-
(True,
|
|
42
|
+
(True, "channel", torch.Size([1, 1])),
|
|
43
|
+
(True, "group", torch.Size([1, 1])),
|
|
44
44
|
(
|
|
45
45
|
False,
|
|
46
|
-
|
|
46
|
+
"block",
|
|
47
47
|
torch.Size(
|
|
48
48
|
[
|
|
49
49
|
1,
|
|
50
50
|
]
|
|
51
51
|
),
|
|
52
52
|
),
|
|
53
|
-
(True,
|
|
53
|
+
(True, "token", torch.Size([1, 1])),
|
|
54
54
|
],
|
|
55
55
|
)
|
|
56
56
|
def test_calculate_qparams(keepdims, strategy, exp_shape):
|
|
57
|
-
value = torch.
|
|
57
|
+
value = torch.empty(5, 6)
|
|
58
58
|
min_val = torch.amin(value, dim=tuple(), keepdims=keepdims)
|
|
59
59
|
max_val = torch.amax(value, dim=tuple(), keepdims=keepdims)
|
|
60
60
|
|
|
61
61
|
if strategy == QuantizationStrategy.GROUP:
|
|
62
62
|
args = QuantizationArgs(strategy=strategy, group_size=2)
|
|
63
|
+
elif strategy == QuantizationStrategy.BLOCK:
|
|
64
|
+
args = QuantizationArgs(strategy=strategy, block_structure=[1, 3])
|
|
63
65
|
else:
|
|
64
|
-
args = QuantizationArgs(
|
|
66
|
+
args = QuantizationArgs(
|
|
67
|
+
strategy=strategy,
|
|
68
|
+
group_size=(2 if strategy == "group" else None),
|
|
69
|
+
block_structure=([1, 3] if strategy == "block" else None),
|
|
70
|
+
)
|
|
65
71
|
scale, zp = calculate_qparams(min_val, max_val, args)
|
|
66
72
|
assert scale.shape == exp_shape
|
|
67
73
|
assert zp.shape == exp_shape
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/.github/workflows/test.yml
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/test_registry.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/tests/testing_utils.py
RENAMED
|
File without changes
|
{compressed_tensors-0.12.3a20251007 → compressed_tensors-0.12.3a20251008}/utils/copyright.py
RENAMED
|
File without changes
|