PyPI - compressed-tensors - Versions diffs - 0.10.3a20250812__tar.gz → 0.10.3a20250815__tar.gz - Mend

compressed-tensors 0.10.3a20250812.tar.gz → 0.10.3a20250815.tar.gz

This diff compares the contents of two publicly available versions of a package, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.

Files changed (152) hide show

{compressed_tensors-0.10.3a20250812/src/compressed_tensors.egg-info → compressed_tensors-0.10.3a20250815}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: compressed-tensors
-Version: 0.10.3a20250812
+Version: 0.10.3a20250815
 Summary: Library for utilization of compressed safetensors of neural network models
 Home-page: https://github.com/neuralmagic/compressed-tensors
 Author: Neuralmagic, Inc.

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/compressors/model_compressors/model_compressor.py RENAMED Viewed

@@ -169,7 +169,7 @@ class ModelCompressor:
         cls,
         model: Module,
         sparsity_config: Union[SparsityCompressionConfig, str, None] = None,
-        quantization_format: Optional[str] = None,
+        quantization_format: Optional[Union[str, List[str]]] = None,
     ) -> Optional["ModelCompressor"]:
         """
         Given a pytorch model and optional sparsity and/or quantization configs,
@@ -182,7 +182,6 @@ class ModelCompressor:
             algorithm
         :return: compressor for the configs, or None if model is not compressed
         """
-        # reconstruct config from schemes attached to modules
         quantization_config = QuantizationConfig.from_pretrained(
             model, format=quantization_format
         )
@@ -203,6 +202,9 @@ class ModelCompressor:
             sparsity_config=sparsity_config,
             quantization_config=quantization_config,
             transform_config=transform_config,
+            compression_formats=[quantization_format]
+            if isinstance(quantization_format, str)
+            else quantization_format,
         )
     @staticmethod
@@ -263,19 +265,39 @@ class ModelCompressor:
         return quantization_config
+    def _fetch_unique_quantization_formats(self) -> List[str]:
+        """
+        Get all unique compression formats present in a model.
+        :return: list of quantization formats
+        """
+        quantization_formats = []
+        for _, scheme in self.quantization_config.config_groups.items():
+            if scheme.format is not None and scheme.format not in quantization_formats:
+                quantization_formats.append(scheme.format)
+        if (
+            len(quantization_formats) == 0
+            and self.quantization_config.format
+            != CompressionFormat.mixed_precision.value
+        ):
+            quantization_formats.append(self.quantization_config.format)
+        return quantization_formats
     def __init__(
         self,
         sparsity_config: Optional[SparsityCompressionConfig] = None,
         quantization_config: Optional[QuantizationConfig] = None,
         transform_config: Optional[TransformConfig] = None,
+        compression_formats: Optional[List[str]] = None,
     ):
         self.sparsity_config = sparsity_config
         self.quantization_config = quantization_config
         self.transform_config = transform_config
+        self.compression_formats = compression_formats
         self.sparsity_compressor = None
         self.quantization_compressor: Optional[
-            Union[BaseQuantizationCompressor, DenseCompressor]
+            Dict[str, Union[BaseQuantizationCompressor, DenseCompressor]]
         ] = None
         # no transform compressor is required
@@ -283,10 +305,21 @@ class ModelCompressor:
             self.sparsity_compressor = BaseCompressor.load_from_registry(
                 sparsity_config.format, config=sparsity_config
             )
         if quantization_config is not None:
-            self.quantization_compressor = BaseCompressor.load_from_registry(
-                quantization_config.format, config=quantization_config
-            )
+            # If a list of compression_format is not provided, we resolve the
+            # relevant quantization formats using the config groups from the config
+            # and if those are not defined, we fall-back to the global quantization format
+            if not self.compression_formats:
+                self.compression_formats = self._fetch_unique_quantization_formats()
+            self.quantization_compressor = {}
+            for format in self.compression_formats:
+                self.quantization_compressor[
+                    format
+                ] = BaseCompressor.load_from_registry(
+                    format, config=quantization_config
+                )
     # ----- used by hf quantizer ----- #
@@ -381,12 +414,13 @@ class ModelCompressor:
                     targets=scheme.targets,
                     ignore=self.quantization_config.ignore,
                 )
-                unexpected_keys.update(
-                    merge_names(target, param)
-                    for target in quant_targets
-                    for param in self.quantization_compressor.compression_param_names
-                    if param != "weight"
-                )
+                for quant_compressor in self.quantization_compressor.values():
+                    unexpected_keys.update(
+                        merge_names(target, param)
+                        for target in quant_targets
+                        for param in quant_compressor.compression_param_names
+                        if param != "weight"
+                    )
         return list(unexpected_keys)
@@ -424,7 +458,21 @@ class ModelCompressor:
                 # quantization first
                 if prefix in module_to_scheme:
-                    state_dict = self.quantization_compressor.compress(
+                    if (
+                        not hasattr(module.quantization_scheme, "format")
+                        or module.quantization_scheme.format is None
+                    ):
+                        if len(self.compression_formats) > 1:
+                            raise ValueError(
+                                "Applying multiple compressors without defining "
+                                "per module formats is not supported "
+                            )
+                        format = self.compression_formats[0]
+                    else:
+                        format = module.quantization_scheme.format
+                    quant_compressor = self.quantization_compressor.get(format)
+                    state_dict = quant_compressor.compress(
                         state_dict,
                         names_to_scheme=module_to_scheme,
                         show_progress=False,
@@ -495,12 +543,24 @@ class ModelCompressor:
                 # quantization second
                 if prefix in module_to_scheme:
-                    state_dict = (
-                        self.quantization_compressor.decompress_module_from_state_dict(
-                            prefix,
-                            state_dict,
-                            scheme=module_to_scheme[prefix],
-                        )
+                    if (
+                        not hasattr(module.quantization_scheme, "format")
+                        or module.quantization_scheme.format is None
+                    ):
+                        if len(self.compression_formats) > 1:
+                            raise ValueError(
+                                "Applying multiple compressors without defining "
+                                "per module formats is not supported "
+                            )
+                        format = self.compression_formats[0]
+                    else:
+                        format = module.quantization_scheme.format
+                    quant_compressor = self.quantization_compressor.get(format)
+                    state_dict = quant_compressor.decompress_module_from_state_dict(
+                        prefix,
+                        state_dict,
+                        scheme=module_to_scheme[prefix],
                     )
                 # remove any existing parameters
@@ -539,7 +599,9 @@ class ModelCompressor:
         if self.quantization_compressor is not None:
             module_to_scheme = map_module_to_scheme(model)
-            state_dict = self.quantization_compressor.compress(
+            # Note - compress only supports one compression format atm
+            quant_compressor = next(iter(self.quantization_compressor.values()))
+            state_dict = quant_compressor.compress(
                 state_dict,
                 names_to_scheme=module_to_scheme,
                 show_progress=show_progress,
@@ -588,14 +650,20 @@ class ModelCompressor:
         """
         model_path = get_safetensors_folder(model_path)
         sparse_decompressed = False
+        quant_compressor = (
+            next(iter(self.quantization_compressor.values()))
+            if self.quantization_compressor is not None
+            else None
+        )
         if (
             self.sparsity_compressor is not None
             and self.sparsity_config.format != CompressionFormat.dense.value
         ):
+            # note - decompress only supports one compressor atm
             params_to_ignore = None
-            if self.quantization_compressor is not None:
-                params_to_ignore = self.quantization_compressor.compression_param_names
+            if quant_compressor is not None:
+                params_to_ignore = quant_compressor.compression_param_names
             # Sparse decompression is applied on the model_path
             # The compressor will try and load any quantization parameters as well
             # params_to_skip_load will skip over quantization params from being loaded
@@ -606,7 +674,7 @@ class ModelCompressor:
             setattr(model, SPARSITY_CONFIG_NAME, self.sparsity_compressor.config)
             sparse_decompressed = True
-        if self.quantization_compressor is not None:
+        if quant_compressor is not None:
             # Temporarily set quantization status to FROZEN to prevent
             # quantization during apply_quantization_config. This ensures
             # that the dtypes of the weights are not unintentionally updated.
@@ -629,7 +697,7 @@ class ModelCompressor:
                     # including initialization
                     load_weight_quantization=(
                         sparse_decompressed
-                        or isinstance(self.quantization_compressor, DenseCompressor)
+                        or isinstance(quant_compressor, DenseCompressor)
                     ),
                 )
@@ -637,7 +705,7 @@ class ModelCompressor:
                 model.state_dict() if sparse_decompressed else model_path
             )
-            dense_gen = self.quantization_compressor.decompress(
+            dense_gen = quant_compressor.decompress(
                 model_path_or_state_dict, names_to_scheme=names_to_scheme
             )
             # TODO: all weight quantization params will be moved to the compressor

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/config/base.py RENAMED Viewed

@@ -32,6 +32,7 @@ class CompressionFormat(Enum):
     naive_quantized = "naive-quantized"
     pack_quantized = "pack-quantized"
     marlin_24 = "marlin-24"
+    mixed_precision = "mixed-precision"
     nvfp4_pack_quantized = "nvfp4-pack-quantized"

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/quantization/quant_config.py RENAMED Viewed

@@ -234,6 +234,12 @@ class QuantizationConfig(BaseModel):
                 format = CompressionFormat.int_quantized.value
             else:
                 format = CompressionFormat.dense.value
+        elif isinstance(format, list):
+            format = (
+                CompressionFormat.mixed_precision.value
+                if len(format) > 1
+                else format[0]
+            )
         return QuantizationConfig(
             config_groups=config_groups,

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/quantization/quant_scheme.py RENAMED Viewed

@@ -16,6 +16,7 @@ import warnings
 from copy import deepcopy
 from typing import List, Optional
+from compressed_tensors.config import CompressionFormat
 from compressed_tensors.quantization.quant_args import (
     DynamicType,
     QuantizationArgs,
@@ -42,18 +43,21 @@ class QuantizationScheme(BaseModel):
     :param weights: quantization config for layer weights
     :param input_activations: quantization config for layer inputs
     :param output_activations: quantization config for layer outputs
+    :param format: CompressionFormat for the layer
     """
     targets: List[str]
     weights: Optional[QuantizationArgs] = None
     input_activations: Optional[QuantizationArgs] = None
     output_activations: Optional[QuantizationArgs] = None
+    format: Optional[str] = None
     @model_validator(mode="after")
     def validate_model_after(model: "QuantizationScheme") -> "QuantizationScheme":
         inputs = model.input_activations
         outputs = model.output_activations
         weights = model.weights
+        format = model.format
         if inputs is not None:
             if inputs.actorder is not None:
@@ -63,6 +67,11 @@ class QuantizationScheme(BaseModel):
             if outputs.actorder is not None:
                 raise ValueError("Cannot apply actorder to output activations")
+        if format == CompressionFormat.mixed_precision.value:
+            raise ValueError(
+                "mixed-precision cannot be set as a format for a QuantizationScheme"
+            )
         if (
             inputs
             and weights

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/utils/match.py RENAMED Viewed

@@ -15,7 +15,7 @@
 import logging
 import re
 from collections.abc import Generator
-from typing import Iterable, Mapping, Optional, Tuple
+from typing import Iterable, List, Mapping, Optional, Tuple, Union
 import torch
 from compressed_tensors.utils.internal import InternalModule
@@ -57,10 +57,10 @@ def match_named_modules(
     unmatched_targets = set(targets)
     for name, module in model.named_modules():
         for target in targets:
-            if is_match(name, module, target, fused):
+            if is_match(name, module, target, fused=fused):
                 unmatched_targets -= {target}
-                if not any(is_match(name, module, ign, fused) for ign in ignore):
+                if not is_match(name, module, ignore, fused=fused):
                     yield name, module
     if warn_on_fail:
@@ -155,9 +155,7 @@ def match_modules_set(
     for name, module in model.named_modules():
         # match until we get a full set
         for target in targets:
-            if is_match(name, module, target) and not any(
-                is_match(name, module, ign) for ign in ignore
-            ):
+            if is_match(name, module, target, ignore):
                 if matches[target] is not None:
                     raise ValueError(f"Matched a {target} twice before completing set")
                 matches[target] = module
@@ -176,7 +174,8 @@ def match_modules_set(
 def is_match(
     name: str,
     module: torch.nn.Module,
-    target: str,
+    targets: Union[str, Iterable[str]],
+    ignore: Union[str, Iterable[str]] = tuple(),
     fused: Optional[FusedMappping] = None,
 ) -> bool:
     """
@@ -198,8 +197,17 @@ def is_match(
     :fused: optional mapping from suffixes of fused modules to the suffixes of their
         corresponding shards
     """
+    targets = [targets] if isinstance(targets, str) else targets
+    ignore = [ignore] if isinstance(ignore, str) else ignore
     return not isinstance(module, InternalModule) and (
-        _match_name(name, target, fused) or _match_class(module, target)
+        any(
+            _match_name(name, target, fused) or _match_class(module, target)
+            for target in targets
+        )
+        and not any(
+            _match_name(name, ign, fused) or _match_class(module, ign) for ign in ignore
+        )
     )

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/version.py RENAMED Viewed

@@ -17,5 +17,5 @@ __version__: str
 __version_tuple__: VERSION_TUPLE
 version_tuple: VERSION_TUPLE
-__version__ = version = '0.10.3.a20250812'
+__version__ = version = '0.10.3.a20250815'
 __version_tuple__ = version_tuple = (0, 10, 3)

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815/src/compressed_tensors.egg-info}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: compressed-tensors
-Version: 0.10.3a20250812
+Version: 0.10.3a20250815
 Summary: Library for utilization of compressed safetensors of neural network models
 Home-page: https://github.com/neuralmagic/compressed-tensors
 Author: Neuralmagic, Inc.

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_compressors/model_compressors/test_model_compressor.py RENAMED Viewed

@@ -20,8 +20,12 @@ import pytest
 import torch
 import torch.nn as nn
 from compressed_tensors.compressors import ModelCompressor
-from compressed_tensors.config import SparsityCompressionConfig
-from compressed_tensors.quantization import QuantizationConfig
+from compressed_tensors.config import CompressionFormat, SparsityCompressionConfig
+from compressed_tensors.quantization import (
+    QuantizationArgs,
+    QuantizationConfig,
+    QuantizationScheme,
+)
 from safetensors.torch import save_file
 from tests.testing_utils import induce_sparsity, requires_hf_quantizer
 from transformers import AutoModelForCausalLM
@@ -395,7 +399,7 @@ def _get_combined_config(s_config, q_config):
 )
 def test_compress_model(model_stub, q_format, s_config, tmpdir):
     model = AutoModelForCausalLM.from_pretrained(model_stub, torch_dtype=torch.float32)
-    compressor = ModelCompressor.from_pretrained_model(model, s_config, q_format)
+    compressor = ModelCompressor.from_pretrained_model(model, s_config, [q_format])
     # compress model by eagerly compressing state dict
     true_compressed = dict(compressor.compress(model))
@@ -443,7 +447,7 @@ def test_compress_model_meta(model_stub, q_format, s_config):
         model_stub, torch_dtype=torch.float32
     )
     reference_compressor = ModelCompressor.from_pretrained_model(
-        cpu_model, s_config, q_format
+        cpu_model, s_config, [q_format]
     )
     # Only stores dtype because meta model does not store values
     expected = {k: v.dtype for k, v in reference_compressor.compress(cpu_model).items()}
@@ -459,7 +463,7 @@ def test_compress_model_meta(model_stub, q_format, s_config):
             module.to_empty(device="meta")
     # Compress in-place on meta model
-    compressor = ModelCompressor.from_pretrained_model(meta_model, s_config, q_format)
+    compressor = ModelCompressor.from_pretrained_model(meta_model, s_config, [q_format])
     compressor.compress_model(meta_model)
     # Compare keys and dtypes
@@ -469,6 +473,43 @@ def test_compress_model_meta(model_stub, q_format, s_config):
         assert compressed[key].dtype == dtype, f"{key} has incorrect dtype"
+def test_multiple_quant_compressors():
+    model = torch.nn.Sequential(torch.nn.Linear(1, 2), torch.nn.Linear(2, 3))
+    input_activations = QuantizationArgs(num_bits=8, type="float")
+    weights = QuantizationArgs(num_bits=8, type="float")
+    scheme_fp8 = QuantizationScheme(
+        targets=["Linear"],
+        weights=weights,
+        input_activations=input_activations,
+        format=CompressionFormat.float_quantized.value,
+    )
+    input_activations = QuantizationArgs(num_bits=4, type="float")
+    weights = QuantizationArgs(num_bits=4, type="float")
+    scheme_nvfp4 = QuantizationScheme(
+        targets=["Linear"],
+        weights=weights,
+        input_activations=input_activations,
+        format=CompressionFormat.nvfp4_pack_quantized.value,
+    )
+    model[0].quantization_scheme = scheme_fp8
+    model[0].quantization_status = "frozen"
+    model[1].quantization_scheme = scheme_nvfp4
+    model[1].quantization_status = "frozen"
+    formats = [scheme_fp8.format, scheme_nvfp4.format]
+    compressor = ModelCompressor.from_pretrained_model(model, None, formats)
+    assert isinstance(compressor.quantization_compressor, dict)
+    assert (
+        compressor.quantization_config.format == CompressionFormat.mixed_precision.value
+    )
+    assert all(format in compressor.quantization_compressor for format in formats)
 @pytest.mark.parametrize(
     "model_stub,comp_stub",
     [

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_quantization/test_quant_scheme.py RENAMED Viewed

@@ -26,12 +26,13 @@ def test_basic_scheme():
     assert scheme.weights == weights
     assert scheme.input_activations is None
     assert scheme.output_activations is None
+    assert scheme.format is None
 def test_full_scheme():
     targets = ["Linear"]
     weights = QuantizationArgs()
-    input_activations = QuantizationArgs(num_bits=4)
+    input_activations = QuantizationArgs(num_bits=8)
     output_activations = QuantizationArgs(num_bits=8, type="float", symmetric=False)
     scheme = QuantizationScheme(
@@ -39,11 +40,13 @@ def test_full_scheme():
         weights=weights,
         input_activations=input_activations,
         output_activations=output_activations,
+        format="float-quantized",
     )
     assert scheme.targets == targets
     assert scheme.weights == weights
     assert scheme.input_activations == input_activations
     assert scheme.output_activations == output_activations
+    assert scheme.format is "float-quantized"
 def test_needs_targets():
@@ -57,3 +60,4 @@ def test_defaults():
     assert output.weights is None
     assert output.input_activations is None
     assert output.output_activations is None
+    assert output.format is None

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_utils/test_match.py RENAMED Viewed

@@ -201,14 +201,20 @@ class TestIsMatch:
             "gate_up_proj": ["gate_proj", "up_proj"],
         }
-        assert is_match("dummy.qkv_proj", linear, "re:.*q_proj", mapping) == True
-        assert is_match("dummy.qkv_proj", linear, "re:.*k_proj", mapping) == True
-        assert is_match("dummy.qkv_proj", linear, "re:.*v_proj", mapping) == True
-        assert is_match("dummy.qkv_proj", linear, "Linear", mapping) == True
-        assert is_match("dummy.gate_up_proj", linear, "re:.*gate_proj", mapping) == True
-        assert is_match("dummy.gate_up_proj", linear, "re:.*up_proj", mapping) == True
-        assert is_match("dummy.gate_up_proj", linear, "Linear", mapping) == True
+        assert is_match("dummy.qkv_proj", linear, "re:.*q_proj", fused=mapping) == True
+        assert is_match("dummy.qkv_proj", linear, "re:.*k_proj", fused=mapping) == True
+        assert is_match("dummy.qkv_proj", linear, "re:.*v_proj", fused=mapping) == True
+        assert is_match("dummy.qkv_proj", linear, "Linear", fused=mapping) == True
+        assert (
+            is_match("dummy.gate_up_proj", linear, "re:.*gate_proj", fused=mapping)
+            == True
+        )
+        assert (
+            is_match("dummy.gate_up_proj", linear, "re:.*up_proj", fused=mapping)
+            == True
+        )
+        assert is_match("dummy.gate_up_proj", linear, "Linear", fused=mapping) == True
 class TestMatchNamedModules:

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/.github/.gitkeep RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/.github/actions/test/action.yml RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/.github/scripts/step-status RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/.github/workflows/build-test.yml RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/.github/workflows/build.yml RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/.github/workflows/report.yml RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/.github/workflows/test-check.yaml RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/.github/workflows/test.yml RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/.github/workflows/trigger-all.yml RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/.github/workflows/upload.yml RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/.gitignore RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/LICENSE RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/Makefile RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/README.md RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/examples/bit_packing/ex_quantize_and_pack.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/examples/bit_packing/int4_config.json RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/examples/bitmask_compression.ipynb RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/examples/llama_1.1b/ex_config_quantization.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/examples/llama_1.1b/ex_llmcompressor_quantization.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/examples/llama_1.1b/example_quant_config.json RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/examples/llama_1.1b/example_quant_recipe.yaml RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/examples/quantize_and_pack_int4.ipynb RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/pyproject.toml RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/setup.cfg RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/setup.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/README.md RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/base.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/compressors/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/compressors/base.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/compressors/helpers.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/compressors/model_compressors/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/compressors/quantized_compressors/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/compressors/quantized_compressors/base.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/compressors/quantized_compressors/naive_quantized.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/compressors/quantized_compressors/nvfp4_quantized.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/compressors/quantized_compressors/pack_quantized.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/compressors/sparse_compressors/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/compressors/sparse_compressors/base.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/compressors/sparse_compressors/dense.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/compressors/sparse_compressors/sparse_24_bitmask.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/compressors/sparse_compressors/sparse_bitmask.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/compressors/sparse_quantized_compressors/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/compressors/sparse_quantized_compressors/marlin_24.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/config/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/config/dense.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/config/sparse_24_bitmask.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/config/sparse_bitmask.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/linear/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/linear/compressed_linear.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/quantization/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/quantization/lifecycle/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/quantization/lifecycle/apply.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/quantization/lifecycle/compressed.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/quantization/lifecycle/forward.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/quantization/lifecycle/helpers.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/quantization/lifecycle/initialize.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/quantization/quant_args.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/quantization/utils/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/quantization/utils/helpers.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/registry/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/registry/registry.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/transform/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/transform/apply.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/transform/factory/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/transform/factory/base.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/transform/factory/hadamard.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/transform/factory/matrix_multiply.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/transform/factory/random_hadamard.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/transform/transform_args.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/transform/transform_config.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/transform/transform_scheme.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/transform/utils/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/transform/utils/hadamard.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/transform/utils/hadamards.safetensors RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/transform/utils/matrix.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/utils/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/utils/helpers.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/utils/internal.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/utils/offload.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/utils/permutations_24.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/utils/permute.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/utils/safetensors_load.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/utils/semi_structured_conversions.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors/utils/type.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors.egg-info/SOURCES.txt RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors.egg-info/dependency_links.txt RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors.egg-info/requires.txt RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/src/compressed_tensors.egg-info/top_level.txt RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/conftest.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_compressors/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_compressors/model_compressors/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_compressors/quantized_compressors/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_compressors/quantized_compressors/test_fp8_quant.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_compressors/quantized_compressors/test_int_quant.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_compressors/quantized_compressors/test_nvfp4_quant.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_compressors/quantized_compressors/test_pack_quant.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_compressors/sparse_compressors/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_compressors/sparse_compressors/test_bitmask.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_compressors/sparse_compressors/test_sparse_24_bitmask.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_compressors/sparse_quantized_compressors/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_compressors/sparse_quantized_compressors/test_marlin_24.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_configs/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_configs/test_base.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_examples/test_bitmask_compression_ipynb.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_linear/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_linear/test_compressed_linear.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_quantization/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_quantization/lifecycle/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_quantization/lifecycle/conftest.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_quantization/lifecycle/test_apply.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_quantization/lifecycle/test_dynamic_lifecycle.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_quantization/lifecycle/test_enabled.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_quantization/lifecycle/test_forward.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_quantization/lifecycle/test_helpers.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_quantization/lifecycle/test_initialize.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_quantization/lifecycle/test_lifecycle.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_quantization/test_configs/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_quantization/test_configs/test_bit_depths.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_quantization/test_configs/test_strategies.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_quantization/test_quant_args.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_quantization/test_quant_config.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_quantization/test_utils/test_helpers.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_registry.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_transform/conftest.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_transform/factory/test_correctness.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_transform/factory/test_memory.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_transform/factory/test_serialization.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_transform/test_transform_args.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_transform/test_transform_config.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_transform/test_transform_scheme.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_transform/utils/test_hadamard.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_utils/__init__.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_utils/test_helpers.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_utils/test_offload.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_utils/test_safetensors_load.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/test_utils/test_type.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/tests/testing_utils.py RENAMED Viewed

File without changes

{compressed_tensors-0.10.3a20250812 → compressed_tensors-0.10.3a20250815}/utils/copyright.py RENAMED Viewed

File without changes

compressed-tensors 0.10.3a20250812__tar.gz → 0.10.3a20250815__tar.gz

compressed-tensors 0.10.3a20250812tar.gz → 0.10.3a20250815tar.gz