compressed-tensors 0.11.1a20250929__tar.gz → 0.12.0__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/.github/actions/test/action.yml +3 -4
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/.github/workflows/test-check.yaml +9 -4
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/.github/workflows/test.yml +7 -8
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/.github/workflows/trigger-all.yml +3 -3
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/PKG-INFO +1 -1
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/transform/factory/hadamard.py +1 -1
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/transform/factory/matrix_multiply.py +1 -1
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/transform/transform_scheme.py +7 -18
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/version.py +2 -2
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors.egg-info/PKG-INFO +1 -1
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_transform/factory/test_correctness.py +2 -2
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_transform/test_transform_scheme.py +0 -25
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_utils/test_helpers.py +6 -7
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/.github/.gitkeep +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/.github/scripts/step-status +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/.github/workflows/build-test.yml +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/.github/workflows/build.yml +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/.github/workflows/quality-check.yaml +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/.github/workflows/report.yml +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/.github/workflows/upload.yml +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/.gitignore +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/LICENSE +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/Makefile +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/README.md +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/examples/bit_packing/ex_quantize_and_pack.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/examples/bit_packing/int4_config.json +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/examples/bitmask_compression.ipynb +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/examples/llama_1.1b/ex_config_quantization.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/examples/llama_1.1b/ex_llmcompressor_quantization.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/examples/llama_1.1b/example_quant_config.json +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/examples/llama_1.1b/example_quant_recipe.yaml +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/examples/quantize_and_pack_int4.ipynb +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/pyproject.toml +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/setup.cfg +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/setup.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/README.md +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/base.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/compressors/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/compressors/base.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/compressors/helpers.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/compressors/model_compressors/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/compressors/model_compressors/model_compressor.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/compressors/quantized_compressors/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/compressors/quantized_compressors/base.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/compressors/quantized_compressors/naive_quantized.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/compressors/quantized_compressors/nvfp4_quantized.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/compressors/quantized_compressors/pack_quantized.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/compressors/sparse_compressors/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/compressors/sparse_compressors/base.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/compressors/sparse_compressors/dense.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/compressors/sparse_compressors/sparse_24_bitmask.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/compressors/sparse_compressors/sparse_bitmask.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/compressors/sparse_quantized_compressors/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/compressors/sparse_quantized_compressors/marlin_24.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/config/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/config/base.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/config/dense.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/config/format.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/config/sparse_24_bitmask.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/config/sparse_bitmask.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/linear/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/linear/compressed_linear.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/logger.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/quantization/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/quantization/lifecycle/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/quantization/lifecycle/apply.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/quantization/lifecycle/compressed.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/quantization/lifecycle/forward.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/quantization/lifecycle/helpers.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/quantization/lifecycle/initialize.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/quantization/quant_args.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/quantization/quant_config.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/quantization/quant_metadata.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/quantization/quant_scheme.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/quantization/utils/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/quantization/utils/helpers.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/registry/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/registry/registry.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/transform/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/transform/apply.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/transform/factory/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/transform/factory/base.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/transform/factory/random_hadamard.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/transform/transform_args.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/transform/transform_config.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/transform/utils/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/transform/utils/hadamard.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/transform/utils/hadamards.safetensors +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/transform/utils/matrix.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/utils/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/utils/helpers.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/utils/internal.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/utils/match.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/utils/offload.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/utils/permutations_24.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/utils/permute.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/utils/safetensors_load.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/utils/semi_structured_conversions.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/utils/type.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors.egg-info/SOURCES.txt +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors.egg-info/dependency_links.txt +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors.egg-info/requires.txt +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors.egg-info/top_level.txt +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/conftest.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_compressors/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_compressors/model_compressors/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_compressors/model_compressors/test_model_compressor.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_compressors/quantized_compressors/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_compressors/quantized_compressors/test_fp8_quant.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_compressors/quantized_compressors/test_int_quant.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_compressors/quantized_compressors/test_nvfp4_quant.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_compressors/quantized_compressors/test_pack_quant.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_compressors/sparse_compressors/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_compressors/sparse_compressors/test_bitmask.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_compressors/sparse_compressors/test_sparse_24_bitmask.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_compressors/sparse_quantized_compressors/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_compressors/sparse_quantized_compressors/test_marlin_24.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_configs/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_configs/test_base.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_configs/test_infer_quant.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_examples/test_bitmask_compression_ipynb.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_linear/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_linear/test_compressed_linear.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_quantization/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_quantization/lifecycle/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_quantization/lifecycle/conftest.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_quantization/lifecycle/test_apply.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_quantization/lifecycle/test_dynamic_lifecycle.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_quantization/lifecycle/test_enabled.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_quantization/lifecycle/test_forward.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_quantization/lifecycle/test_helpers.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_quantization/lifecycle/test_initialize.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_quantization/lifecycle/test_lifecycle.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_quantization/test_configs/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_quantization/test_configs/test_bit_depths.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_quantization/test_configs/test_strategies.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_quantization/test_quant_args.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_quantization/test_quant_config.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_quantization/test_quant_scheme.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_quantization/test_utils/test_helpers.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_registry.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_transform/conftest.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_transform/factory/test_memory.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_transform/factory/test_serialization.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_transform/test_transform_args.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_transform/test_transform_config.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_transform/utils/test_hadamard.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_utils/__init__.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_utils/test_match.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_utils/test_offload.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_utils/test_safetensors_load.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_utils/test_type.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/testing_utils.py +0 -0
- {compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/utils/copyright.py +0 -0
{compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/.github/actions/test/action.yml
RENAMED
|
@@ -9,8 +9,7 @@ inputs:
|
|
|
9
9
|
required: true
|
|
10
10
|
code_coverage:
|
|
11
11
|
description: whether to collect code coverage metrics during test run
|
|
12
|
-
|
|
13
|
-
default: false
|
|
12
|
+
default: 'false'
|
|
14
13
|
outputs:
|
|
15
14
|
status:
|
|
16
15
|
description: "final status from test"
|
|
@@ -51,7 +50,7 @@ runs:
|
|
|
51
50
|
|
|
52
51
|
if [[ "${ENABLE_COVERAGE}" == "true" ]]; then
|
|
53
52
|
echo "::group::Installing code coverage requirements via pip"
|
|
54
|
-
pip install
|
|
53
|
+
pip install https://github.com/neuralmagic/pytest-nm-releng/archive/v0.4.0.tar.gz
|
|
55
54
|
pip install coverage pytest-cov
|
|
56
55
|
|
|
57
56
|
# Adding Code coverage to the tests
|
|
@@ -76,7 +75,7 @@ runs:
|
|
|
76
75
|
fi
|
|
77
76
|
echo "::endgroup::"
|
|
78
77
|
fi
|
|
79
|
-
|
|
78
|
+
|
|
80
79
|
deactivate
|
|
81
80
|
exit ${SUCCESS}
|
|
82
81
|
shell: bash
|
{compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/.github/workflows/test-check.yaml
RENAMED
|
@@ -12,7 +12,10 @@ on:
|
|
|
12
12
|
|
|
13
13
|
jobs:
|
|
14
14
|
python-tests:
|
|
15
|
-
runs-on:
|
|
15
|
+
runs-on: k8s-util
|
|
16
|
+
env:
|
|
17
|
+
HF_HOME: /model-cache
|
|
18
|
+
HF_TOKEN: ${{ secrets.NM_HF_TOKEN_READ_ONLY }}
|
|
16
19
|
steps:
|
|
17
20
|
- uses: actions/setup-python@v5
|
|
18
21
|
with:
|
|
@@ -21,11 +24,13 @@ jobs:
|
|
|
21
24
|
with:
|
|
22
25
|
fetch-depth: 0
|
|
23
26
|
fetch-tags: true
|
|
27
|
+
- name: Install system dependencies
|
|
28
|
+
run: |-
|
|
29
|
+
sudo apt-get update
|
|
30
|
+
sudo apt-get install -y --no-install-recommends g++ gcc make
|
|
24
31
|
- name: Set Env
|
|
25
|
-
run:
|
|
26
|
-
pip3 install --upgrade pip && pip3 install --upgrade setuptools
|
|
32
|
+
run: pip3 install --upgrade pip setuptools
|
|
27
33
|
- name: "⚙️ Install dependencies"
|
|
28
34
|
run: pip3 install .[dev,accelerate]
|
|
29
35
|
- name: "🔬 Running tests"
|
|
30
36
|
run: make test
|
|
31
|
-
|
|
@@ -71,6 +71,9 @@ jobs:
|
|
|
71
71
|
contents: 'read'
|
|
72
72
|
id-token: 'write'
|
|
73
73
|
pages: 'write'
|
|
74
|
+
env:
|
|
75
|
+
HF_HOME: /model-cache
|
|
76
|
+
HF_TOKEN: ${{ secrets.NM_HF_TOKEN_READ_ONLY }}
|
|
74
77
|
environment:
|
|
75
78
|
name: github-pages
|
|
76
79
|
url: ${{ steps.coverage.outputs.page_url }}
|
|
@@ -90,13 +93,9 @@ jobs:
|
|
|
90
93
|
python-version: ${{ inputs.python }}
|
|
91
94
|
|
|
92
95
|
- name: install system dependencies
|
|
93
|
-
run:
|
|
94
|
-
|
|
95
|
-
|
|
96
|
-
else
|
|
97
|
-
echo "installing g++ etc compilers..."
|
|
98
|
-
sudo apt update && sudo apt install -y g++ gcc
|
|
99
|
-
fi
|
|
96
|
+
run: |-
|
|
97
|
+
sudo apt-get update
|
|
98
|
+
sudo apt-get install -y --no-install-recommends g++ gcc make
|
|
100
99
|
shell: bash
|
|
101
100
|
|
|
102
101
|
- name: checkout code
|
|
@@ -172,7 +171,7 @@ jobs:
|
|
|
172
171
|
uses: actions/upload-artifact@v4
|
|
173
172
|
if: success() || failure()
|
|
174
173
|
with:
|
|
175
|
-
name: report-${{ inputs.test_label }}.xml
|
|
174
|
+
name: report-${{ inputs.python }}-${{ inputs.test_label }}.xml
|
|
176
175
|
path: test-results/report.xml
|
|
177
176
|
retention-days: 5
|
|
178
177
|
|
{compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/.github/workflows/trigger-all.yml
RENAMED
|
@@ -19,7 +19,7 @@ on:
|
|
|
19
19
|
type: boolean
|
|
20
20
|
default: false
|
|
21
21
|
gitref:
|
|
22
|
-
description: "git commit hash or tag name"
|
|
22
|
+
description: "git commit hash or tag name"
|
|
23
23
|
type: string
|
|
24
24
|
default: 'main'
|
|
25
25
|
|
|
@@ -32,8 +32,8 @@ jobs:
|
|
|
32
32
|
wf_category: ${{ inputs.wf_category || 'NIGHTLY' }}
|
|
33
33
|
gitref: ${{ inputs.gitref || 'main' }}
|
|
34
34
|
push_to_pypi: ${{ (github.event.schedule == '30 0 * * *') || inputs.push_to_pypi || false }}
|
|
35
|
-
test_configs: '[{"python":"3.11.4","label":"
|
|
36
|
-
{"python":"3.10.12","label":"
|
|
35
|
+
test_configs: '[{"python":"3.11.4","label":"k8s-util","timeout":"40","code_coverage":true},
|
|
36
|
+
{"python":"3.10.12","label":"k8s-util","timeout":"40"},
|
|
37
37
|
{"python":"3.9.17","label":"k8s-h100-solo","timeout":"40"},
|
|
38
38
|
{"python":"3.12.6","label":"k8s-a100-duo","timeout":"40"}]'
|
|
39
39
|
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: compressed-tensors
|
|
3
|
-
Version: 0.
|
|
3
|
+
Version: 0.12.0
|
|
4
4
|
Summary: Library for utilization of compressed safetensors of neural network models
|
|
5
5
|
Home-page: https://github.com/neuralmagic/compressed-tensors
|
|
6
6
|
Author: Neuralmagic, Inc.
|
|
@@ -52,7 +52,7 @@ class HadamardFactory(TransformFactory):
|
|
|
52
52
|
:param args: defines how the transform will be applied to the module
|
|
53
53
|
"""
|
|
54
54
|
assert hasattr(module, "weight")
|
|
55
|
-
size = get_transform_size(module, args.location, self.scheme.
|
|
55
|
+
size = get_transform_size(module, args.location, self.scheme.head_dim)
|
|
56
56
|
exec_device = get_execution_device(module)
|
|
57
57
|
device = get_offloaded_device(module)
|
|
58
58
|
precision = self.scheme.precision if args.is_online() else torch.float64
|
|
@@ -51,7 +51,7 @@ class RandomMatrixFactory(TransformFactory):
|
|
|
51
51
|
:param args: defines how the transform will be applied to the module
|
|
52
52
|
"""
|
|
53
53
|
assert hasattr(module, "weight")
|
|
54
|
-
size = get_transform_size(module, args.location, self.scheme.
|
|
54
|
+
size = get_transform_size(module, args.location, self.scheme.head_dim)
|
|
55
55
|
device = get_offloaded_device(module)
|
|
56
56
|
precision = self.scheme.precision if args.is_online() else torch.float64
|
|
57
57
|
|
|
@@ -17,7 +17,7 @@ from typing import List, Optional
|
|
|
17
17
|
import torch
|
|
18
18
|
from compressed_tensors.transform import TransformArgs
|
|
19
19
|
from compressed_tensors.utils import TorchDtype
|
|
20
|
-
from pydantic import BaseModel, ConfigDict, Field
|
|
20
|
+
from pydantic import BaseModel, ConfigDict, Field
|
|
21
21
|
|
|
22
22
|
|
|
23
23
|
__all__ = ["TransformScheme"]
|
|
@@ -36,8 +36,11 @@ class TransformScheme(BaseModel):
|
|
|
36
36
|
:param randomize: True if uniquely randomized transform weights should be used,
|
|
37
37
|
otherwise use identical transform weights where applicable
|
|
38
38
|
:param requires_grad: True if weights include gradients for training
|
|
39
|
-
:param
|
|
40
|
-
block being a square matrix of this size.
|
|
39
|
+
:param head_dim: If set, the transform matrix will be block diagonal with each
|
|
40
|
+
block being a square matrix of this size. The name head_dim was chosen because
|
|
41
|
+
some rotations need to be block-diagonal with block size equal to the head_dim,
|
|
42
|
+
but research has shown value in applying some rotations with smaller block size,
|
|
43
|
+
irrespective of head_dim.
|
|
41
44
|
:param precision: Precision at which this transform should be applied during online
|
|
42
45
|
rotations. Fused (offline) rotations are always performed in float64
|
|
43
46
|
"""
|
|
@@ -46,21 +49,7 @@ class TransformScheme(BaseModel):
|
|
|
46
49
|
apply: List[TransformArgs] = Field(default_factory=list)
|
|
47
50
|
randomize: bool = Field(default=False)
|
|
48
51
|
requires_grad: bool = Field(default=False)
|
|
49
|
-
|
|
50
|
-
head_dim: Optional[int] = Field(
|
|
51
|
-
default=None, deprecated="head_dim is deprecated, use block_size instead"
|
|
52
|
-
)
|
|
52
|
+
head_dim: Optional[int] = Field(default=None)
|
|
53
53
|
precision: TorchDtype = Field(default=torch.float32)
|
|
54
54
|
|
|
55
|
-
@model_validator(mode="after")
|
|
56
|
-
def validate_model_after(model: "TransformScheme") -> "TransformScheme":
|
|
57
|
-
"""
|
|
58
|
-
If head_dim is used instead of block_size, set block_size to head_dim
|
|
59
|
-
and remove head_dim
|
|
60
|
-
"""
|
|
61
|
-
if model.block_size is None and model.head_dim is not None:
|
|
62
|
-
model.block_size = model.head_dim
|
|
63
|
-
model.head_dim = None
|
|
64
|
-
return model
|
|
65
|
-
|
|
66
55
|
model_config = ConfigDict(extra="forbid")
|
{compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/version.py
RENAMED
|
@@ -17,5 +17,5 @@ __version__: str
|
|
|
17
17
|
__version_tuple__: VERSION_TUPLE
|
|
18
18
|
version_tuple: VERSION_TUPLE
|
|
19
19
|
|
|
20
|
-
__version__ = version = '0.
|
|
21
|
-
__version_tuple__ = version_tuple = (0,
|
|
20
|
+
__version__ = version = '0.12.0'
|
|
21
|
+
__version_tuple__ = version_tuple = (0, 12, 0)
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: compressed-tensors
|
|
3
|
-
Version: 0.
|
|
3
|
+
Version: 0.12.0
|
|
4
4
|
Summary: Library for utilization of compressed safetensors of neural network models
|
|
5
5
|
Home-page: https://github.com/neuralmagic/compressed-tensors
|
|
6
6
|
Author: Neuralmagic, Inc.
|
|
@@ -33,7 +33,7 @@ from tests.testing_utils import requires_accelerate, requires_gpu
|
|
|
33
33
|
def test_correctness_linear(type, randomize, head_dim, input_batch_size):
|
|
34
34
|
size = (4, 8)
|
|
35
35
|
module = torch.nn.Linear(*size, bias=False)
|
|
36
|
-
scheme = TransformScheme(type=type, randomize=randomize,
|
|
36
|
+
scheme = TransformScheme(type=type, randomize=randomize, head_dim=head_dim)
|
|
37
37
|
factory = TransformFactory.from_scheme(scheme, name="")
|
|
38
38
|
|
|
39
39
|
input_tfm = factory.create_transform(
|
|
@@ -150,7 +150,7 @@ def test_correctness_attention_heads(type, randomize, head_dim, input_batch_size
|
|
|
150
150
|
"": TransformScheme(
|
|
151
151
|
type=type,
|
|
152
152
|
randomize=randomize,
|
|
153
|
-
|
|
153
|
+
head_dim=head_dim,
|
|
154
154
|
apply=[
|
|
155
155
|
TransformArgs(targets="v_proj", location="weight_output"),
|
|
156
156
|
TransformArgs(
|
|
@@ -72,28 +72,3 @@ def test_multiple_groups():
|
|
|
72
72
|
assert not scheme.randomize
|
|
73
73
|
assert scheme.type == "hadamard"
|
|
74
74
|
assert len(scheme.apply) == 20
|
|
75
|
-
|
|
76
|
-
|
|
77
|
-
def test_transform_scheme_block_size():
|
|
78
|
-
"""
|
|
79
|
-
Ensure json with (deprecated) `head_dim` or `block_size`
|
|
80
|
-
both load up correctly and save with `block_size` field
|
|
81
|
-
"""
|
|
82
|
-
|
|
83
|
-
old_scheme = TransformScheme.model_validate_json(
|
|
84
|
-
'{"type": "hadamard", "head_dim": 128}'
|
|
85
|
-
)
|
|
86
|
-
assert old_scheme.block_size == 128
|
|
87
|
-
assert old_scheme.model_dump()["block_size"] == 128
|
|
88
|
-
old_scheme = TransformScheme(type="hadamard", head_dim=64)
|
|
89
|
-
assert old_scheme.block_size == 64
|
|
90
|
-
assert old_scheme.model_dump()["block_size"] == 64
|
|
91
|
-
|
|
92
|
-
new_scheme = TransformScheme.model_validate_json(
|
|
93
|
-
'{"type": "hadamard", "block_size": 128}'
|
|
94
|
-
)
|
|
95
|
-
assert new_scheme.block_size == 128
|
|
96
|
-
assert new_scheme.model_dump()["block_size"] == 128
|
|
97
|
-
new_scheme = TransformScheme(type="hadamard", block_size=64)
|
|
98
|
-
assert new_scheme.block_size == 64
|
|
99
|
-
assert new_scheme.model_dump()["block_size"] == 64
|
{compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_utils/test_helpers.py
RENAMED
|
@@ -36,12 +36,11 @@ def tensors():
|
|
|
36
36
|
|
|
37
37
|
|
|
38
38
|
@pytest.fixture
|
|
39
|
-
def llama_model(
|
|
40
|
-
|
|
41
|
-
|
|
42
|
-
|
|
39
|
+
def llama_model():
|
|
40
|
+
return AutoModelForCausalLM.from_pretrained(
|
|
41
|
+
"RedHatAI/llama2.c-stories110M-pruned50",
|
|
42
|
+
torch_dtype="auto",
|
|
43
43
|
)
|
|
44
|
-
yield model
|
|
45
44
|
|
|
46
45
|
|
|
47
46
|
def test_save_compressed_sparse_bitmask(tmp_path, tensors):
|
|
@@ -120,9 +119,9 @@ def test_load_compressed_dense(tmp_path, tensors):
|
|
|
120
119
|
|
|
121
120
|
|
|
122
121
|
def test_load_compressed_sharded(tmp_path, llama_model):
|
|
123
|
-
sharded_model_path = tmp_path / "
|
|
122
|
+
sharded_model_path = tmp_path / "sharded_model"
|
|
124
123
|
llama_model.save_pretrained(sharded_model_path, max_shard_size="2MB")
|
|
125
|
-
# make sure that model is
|
|
124
|
+
# make sure that model is sharded on disk
|
|
126
125
|
assert len(os.listdir(sharded_model_path)) > 1
|
|
127
126
|
loaded_state_dict = dict(load_compressed(sharded_model_path))
|
|
128
127
|
for key, value in llama_model.state_dict().items():
|
|
File without changes
|
{compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/.github/scripts/step-status
RENAMED
|
File without changes
|
{compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/.github/workflows/build-test.yml
RENAMED
|
File without changes
|
{compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/.github/workflows/build.yml
RENAMED
|
File without changes
|
|
File without changes
|
{compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/.github/workflows/report.yml
RENAMED
|
File without changes
|
{compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/.github/workflows/upload.yml
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/examples/bitmask_compression.ipynb
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/README.md
RENAMED
|
File without changes
|
{compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/__init__.py
RENAMED
|
File without changes
|
{compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/base.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/src/compressed_tensors/logger.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_compressors/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_configs/__init__.py
RENAMED
|
File without changes
|
{compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_configs/test_base.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_linear/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
{compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_quantization/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_transform/conftest.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_utils/__init__.py
RENAMED
|
File without changes
|
{compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_utils/test_match.py
RENAMED
|
File without changes
|
{compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_utils/test_offload.py
RENAMED
|
File without changes
|
|
File without changes
|
{compressed_tensors-0.11.1a20250929 → compressed_tensors-0.12.0}/tests/test_utils/test_type.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|