compressed-tensors 0.13.1a20260109__tar.gz → 0.13.1a20260116__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {compressed_tensors-0.13.1a20260109/src/compressed_tensors.egg-info → compressed_tensors-0.13.1a20260116}/PKG-INFO +1 -1
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/quantization/quant_scheme.py +21 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/quantization/utils/mxfp4_utils.py +1 -1
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/version.py +1 -1
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116/src/compressed_tensors.egg-info}/PKG-INFO +1 -1
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_quantization/test_utils/test_mxfp4_utils.py +1 -1
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/.github/.gitkeep +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/.github/actions/test/action.yml +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/.github/scripts/step-status +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/.github/workflows/quality-check.yaml +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/.github/workflows/test-check.yaml +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/.gitignore +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/LICENSE +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/Makefile +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/README.md +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/examples/bit_packing/ex_quantize_and_pack.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/examples/bit_packing/int4_config.json +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/examples/bitmask_compression.ipynb +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/examples/llama_1.1b/ex_config_quantization.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/examples/llama_1.1b/ex_llmcompressor_quantization.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/examples/llama_1.1b/example_quant_config.json +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/examples/llama_1.1b/example_quant_recipe.yaml +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/examples/quantize_and_pack_int4.ipynb +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/pyproject.toml +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/setup.cfg +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/setup.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/README.md +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/base.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/compressors/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/compressors/base.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/compressors/helpers.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/compressors/model_compressors/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/compressors/model_compressors/model_compressor.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/compressors/quantized_compressors/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/compressors/quantized_compressors/base.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/compressors/quantized_compressors/fp4_quantized.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/compressors/quantized_compressors/naive_quantized.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/compressors/quantized_compressors/pack_quantized.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/compressors/sparse_compressors/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/compressors/sparse_compressors/base.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/compressors/sparse_compressors/dense.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/compressors/sparse_compressors/sparse_24_bitmask.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/compressors/sparse_compressors/sparse_bitmask.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/compressors/sparse_quantized_compressors/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/compressors/sparse_quantized_compressors/marlin_24.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/config/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/config/base.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/config/dense.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/config/format.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/config/sparse_24_bitmask.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/config/sparse_bitmask.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/linear/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/linear/compressed_linear.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/logger.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/modeling/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/modeling/attention.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/modeling/kvcache.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/quantization/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/quantization/lifecycle/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/quantization/lifecycle/apply.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/quantization/lifecycle/compressed.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/quantization/lifecycle/forward.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/quantization/lifecycle/helpers.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/quantization/lifecycle/initialize.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/quantization/quant_args.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/quantization/quant_config.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/quantization/quant_metadata.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/quantization/utils/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/quantization/utils/helpers.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/registry/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/registry/registry.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/transform/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/transform/apply.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/transform/factory/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/transform/factory/base.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/transform/factory/hadamard.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/transform/factory/matrix_multiply.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/transform/factory/random_hadamard.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/transform/transform_args.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/transform/transform_config.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/transform/transform_scheme.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/transform/utils/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/transform/utils/hadamard.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/transform/utils/hadamards.safetensors +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/transform/utils/matrix.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/utils/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/utils/helpers.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/utils/internal.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/utils/match.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/utils/offload.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/utils/permutations_24.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/utils/safetensors_load.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/utils/semi_structured_conversions.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors/utils/type.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors.egg-info/SOURCES.txt +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors.egg-info/dependency_links.txt +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors.egg-info/requires.txt +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/src/compressed_tensors.egg-info/top_level.txt +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/conftest.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/mock_observer.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_compressors/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_compressors/model_compressors/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_compressors/model_compressors/test_model_compressor.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_compressors/quantized_compressors/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_compressors/quantized_compressors/test_fp4_quant.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_compressors/quantized_compressors/test_fp8_quant.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_compressors/quantized_compressors/test_int_quant.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_compressors/quantized_compressors/test_pack_quant.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_compressors/quantized_compressors/test_packed_asym_decompression.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_compressors/sparse_compressors/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_compressors/sparse_compressors/test_bitmask.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_compressors/sparse_compressors/test_sparse_24_bitmask.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_compressors/sparse_quantized_compressors/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_compressors/sparse_quantized_compressors/test_marlin_24.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_configs/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_configs/test_base.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_configs/test_infer_quant.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_examples/test_bitmask_compression_ipynb.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_linear/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_linear/test_compressed_linear.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_modeling/test_attention_and_cache.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_quantization/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_quantization/lifecycle/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_quantization/lifecycle/conftest.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_quantization/lifecycle/test_apply.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_quantization/lifecycle/test_dynamic_lifecycle.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_quantization/lifecycle/test_enabled.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_quantization/lifecycle/test_forward.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_quantization/lifecycle/test_initialize.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_quantization/lifecycle/test_lifecycle.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_quantization/lifecycle/test_static_lifecycle.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_quantization/test_configs/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_quantization/test_configs/test_bit_depths.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_quantization/test_configs/test_strategies.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_quantization/test_quant_args.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_quantization/test_quant_config.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_quantization/test_quant_scheme.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_quantization/test_utils/test_helpers.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_registry.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_transform/conftest.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_transform/factory/test_correctness.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_transform/factory/test_memory.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_transform/factory/test_serialization.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_transform/test_transform_args.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_transform/test_transform_config.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_transform/test_transform_scheme.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_transform/utils/test_hadamard.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_utils/__init__.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_utils/test_helpers.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_utils/test_match.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_utils/test_offload.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_utils/test_safetensors_load.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_utils/test_type.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/testing_utils.py +0 -0
- {compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/utils/copyright.py +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: compressed-tensors
|
|
3
|
-
Version: 0.13.1a20260109
|
|
3
|
+
Version: 0.13.1a20260116
|
|
4
4
|
Summary: Library for utilization of compressed safetensors of neural network models
|
|
5
5
|
Home-page: https://github.com/vllm-project/compressed-tensors
|
|
6
6
|
Author: Neuralmagic, Inc.
|
|
@@ -303,6 +303,26 @@ INT8_W4A8 = dict(
|
|
|
303
303
|
),
|
|
304
304
|
)
|
|
305
305
|
|
|
306
|
+
# 4 bit integer weights and 8 bit FP activations quantization
|
|
307
|
+
W4AFP8 = dict(
|
|
308
|
+
weights=QuantizationArgs(
|
|
309
|
+
num_bits=4,
|
|
310
|
+
type=QuantizationType.INT,
|
|
311
|
+
strategy=QuantizationStrategy.GROUP,
|
|
312
|
+
group_size=128,
|
|
313
|
+
symmetric=True,
|
|
314
|
+
dynamic=False,
|
|
315
|
+
),
|
|
316
|
+
input_activations=QuantizationArgs(
|
|
317
|
+
num_bits=8,
|
|
318
|
+
type=QuantizationType.FLOAT,
|
|
319
|
+
strategy=QuantizationStrategy.TOKEN,
|
|
320
|
+
symmetric=True,
|
|
321
|
+
dynamic=True,
|
|
322
|
+
observer=None,
|
|
323
|
+
),
|
|
324
|
+
)
|
|
325
|
+
|
|
306
326
|
# FP8 weights and FP8 activations quantization
|
|
307
327
|
FP8 = dict(
|
|
308
328
|
weights=QuantizationArgs(
|
|
@@ -374,6 +394,7 @@ PRESET_SCHEMES = {
|
|
|
374
394
|
"W8A8": INT8_W8A8,
|
|
375
395
|
"INT8": INT8_W8A8, # alias for W8A8
|
|
376
396
|
"W4A8": INT8_W4A8,
|
|
397
|
+
"W4AFP8": W4AFP8,
|
|
377
398
|
# Float weight and activation schemes
|
|
378
399
|
"FP8": FP8,
|
|
379
400
|
"FP8_DYNAMIC": FP8_DYNAMIC,
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: compressed-tensors
|
|
3
|
-
Version: 0.13.1a20260109
|
|
3
|
+
Version: 0.13.1a20260116
|
|
4
4
|
Summary: Library for utilization of compressed safetensors of neural network models
|
|
5
5
|
Home-page: https://github.com/vllm-project/compressed-tensors
|
|
6
6
|
Author: Neuralmagic, Inc.
|
|
@@ -93,5 +93,5 @@ def test_mxfp4_scales_e2e():
|
|
|
93
93
|
converted_ct = maybe_convert_from_mxfp4_exp(args=args, scale=scales)
|
|
94
94
|
|
|
95
95
|
scales_exp = torch.log2(converted_ct)
|
|
96
|
-
block_max_exp = torch.floor(torch.log2(round_to_power_2(block_max)))
|
|
96
|
+
block_max_exp = torch.floor(torch.log2(round_to_power_2(block_max))) - 2
|
|
97
97
|
assert torch.equal(scales_exp, block_max_exp)
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/mock_observer.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/test_registry.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/tests/testing_utils.py
RENAMED
|
File without changes
|
{compressed_tensors-0.13.1a20260109 → compressed_tensors-0.13.1a20260116}/utils/copyright.py
RENAMED
|
File without changes
|