compressed-tensors 0.12.3a20251114__tar.gz → 0.12.3a20251203__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (158)
  1. {compressed_tensors-0.12.3a20251114/src/compressed_tensors.egg-info → compressed_tensors-0.12.3a20251203}/PKG-INFO +1 -1
  2. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/utils/match.py +164 -35
  3. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/version.py +1 -1
  4. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203/src/compressed_tensors.egg-info}/PKG-INFO +1 -1
  5. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_utils/test_match.py +153 -12
  6. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/.github/.gitkeep +0 -0
  7. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/.github/actions/test/action.yml +0 -0
  8. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/.github/scripts/step-status +0 -0
  9. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/.github/workflows/quality-check.yaml +0 -0
  10. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/.github/workflows/test-check.yaml +0 -0
  11. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/.gitignore +0 -0
  12. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/LICENSE +0 -0
  13. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/Makefile +0 -0
  14. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/README.md +0 -0
  15. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/examples/bit_packing/ex_quantize_and_pack.py +0 -0
  16. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/examples/bit_packing/int4_config.json +0 -0
  17. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/examples/bitmask_compression.ipynb +0 -0
  18. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/examples/llama_1.1b/ex_config_quantization.py +0 -0
  19. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/examples/llama_1.1b/ex_llmcompressor_quantization.py +0 -0
  20. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/examples/llama_1.1b/example_quant_config.json +0 -0
  21. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/examples/llama_1.1b/example_quant_recipe.yaml +0 -0
  22. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/examples/quantize_and_pack_int4.ipynb +0 -0
  23. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/pyproject.toml +0 -0
  24. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/setup.cfg +0 -0
  25. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/setup.py +0 -0
  26. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/__init__.py +0 -0
  27. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/README.md +0 -0
  28. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/__init__.py +0 -0
  29. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/base.py +0 -0
  30. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/compressors/__init__.py +0 -0
  31. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/compressors/base.py +0 -0
  32. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/compressors/helpers.py +0 -0
  33. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/compressors/model_compressors/__init__.py +0 -0
  34. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/compressors/model_compressors/model_compressor.py +0 -0
  35. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/compressors/quantized_compressors/__init__.py +0 -0
  36. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/compressors/quantized_compressors/base.py +0 -0
  37. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/compressors/quantized_compressors/fp4_quantized.py +0 -0
  38. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/compressors/quantized_compressors/naive_quantized.py +0 -0
  39. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/compressors/quantized_compressors/pack_quantized.py +0 -0
  40. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/compressors/sparse_compressors/__init__.py +0 -0
  41. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/compressors/sparse_compressors/base.py +0 -0
  42. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/compressors/sparse_compressors/dense.py +0 -0
  43. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/compressors/sparse_compressors/sparse_24_bitmask.py +0 -0
  44. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/compressors/sparse_compressors/sparse_bitmask.py +0 -0
  45. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/compressors/sparse_quantized_compressors/__init__.py +0 -0
  46. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/compressors/sparse_quantized_compressors/marlin_24.py +0 -0
  47. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/config/__init__.py +0 -0
  48. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/config/base.py +0 -0
  49. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/config/dense.py +0 -0
  50. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/config/format.py +0 -0
  51. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/config/sparse_24_bitmask.py +0 -0
  52. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/config/sparse_bitmask.py +0 -0
  53. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/linear/__init__.py +0 -0
  54. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/linear/compressed_linear.py +0 -0
  55. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/logger.py +0 -0
  56. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/modeling/__init__.py +0 -0
  57. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/modeling/attention.py +0 -0
  58. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/modeling/kvcache.py +0 -0
  59. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/quantization/__init__.py +0 -0
  60. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/quantization/lifecycle/__init__.py +0 -0
  61. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/quantization/lifecycle/apply.py +0 -0
  62. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/quantization/lifecycle/compressed.py +0 -0
  63. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/quantization/lifecycle/forward.py +0 -0
  64. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/quantization/lifecycle/helpers.py +0 -0
  65. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/quantization/lifecycle/initialize.py +0 -0
  66. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/quantization/quant_args.py +0 -0
  67. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/quantization/quant_config.py +0 -0
  68. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/quantization/quant_metadata.py +0 -0
  69. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/quantization/quant_scheme.py +0 -0
  70. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/quantization/utils/__init__.py +0 -0
  71. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/quantization/utils/helpers.py +0 -0
  72. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/quantization/utils/mxfp4_utils.py +0 -0
  73. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/registry/__init__.py +0 -0
  74. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/registry/registry.py +0 -0
  75. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/transform/__init__.py +0 -0
  76. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/transform/apply.py +0 -0
  77. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/transform/factory/__init__.py +0 -0
  78. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/transform/factory/base.py +0 -0
  79. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/transform/factory/hadamard.py +0 -0
  80. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/transform/factory/matrix_multiply.py +0 -0
  81. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/transform/factory/random_hadamard.py +0 -0
  82. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/transform/transform_args.py +0 -0
  83. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/transform/transform_config.py +0 -0
  84. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/transform/transform_scheme.py +0 -0
  85. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/transform/utils/__init__.py +0 -0
  86. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/transform/utils/hadamard.py +0 -0
  87. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/transform/utils/hadamards.safetensors +0 -0
  88. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/transform/utils/matrix.py +0 -0
  89. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/utils/__init__.py +0 -0
  90. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/utils/helpers.py +0 -0
  91. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/utils/internal.py +0 -0
  92. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/utils/offload.py +0 -0
  93. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/utils/permutations_24.py +0 -0
  94. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/utils/safetensors_load.py +0 -0
  95. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/utils/semi_structured_conversions.py +0 -0
  96. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors/utils/type.py +0 -0
  97. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors.egg-info/SOURCES.txt +0 -0
  98. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors.egg-info/dependency_links.txt +0 -0
  99. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors.egg-info/requires.txt +0 -0
  100. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/src/compressed_tensors.egg-info/top_level.txt +0 -0
  101. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/__init__.py +0 -0
  102. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/conftest.py +0 -0
  103. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/mock_observer.py +0 -0
  104. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_compressors/__init__.py +0 -0
  105. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_compressors/model_compressors/__init__.py +0 -0
  106. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_compressors/model_compressors/test_model_compressor.py +0 -0
  107. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_compressors/quantized_compressors/__init__.py +0 -0
  108. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_compressors/quantized_compressors/test_fp4_quant.py +0 -0
  109. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_compressors/quantized_compressors/test_fp8_quant.py +0 -0
  110. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_compressors/quantized_compressors/test_int_quant.py +0 -0
  111. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_compressors/quantized_compressors/test_pack_quant.py +0 -0
  112. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_compressors/quantized_compressors/test_packed_asym_decompression.py +0 -0
  113. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_compressors/sparse_compressors/__init__.py +0 -0
  114. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_compressors/sparse_compressors/test_bitmask.py +0 -0
  115. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_compressors/sparse_compressors/test_sparse_24_bitmask.py +0 -0
  116. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_compressors/sparse_quantized_compressors/__init__.py +0 -0
  117. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_compressors/sparse_quantized_compressors/test_marlin_24.py +0 -0
  118. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_configs/__init__.py +0 -0
  119. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_configs/test_base.py +0 -0
  120. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_configs/test_infer_quant.py +0 -0
  121. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_examples/test_bitmask_compression_ipynb.py +0 -0
  122. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_linear/__init__.py +0 -0
  123. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_linear/test_compressed_linear.py +0 -0
  124. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_modeling/test_attention_and_cache.py +0 -0
  125. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_quantization/__init__.py +0 -0
  126. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_quantization/lifecycle/__init__.py +0 -0
  127. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_quantization/lifecycle/conftest.py +0 -0
  128. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_quantization/lifecycle/test_apply.py +0 -0
  129. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_quantization/lifecycle/test_dynamic_lifecycle.py +0 -0
  130. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_quantization/lifecycle/test_enabled.py +0 -0
  131. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_quantization/lifecycle/test_forward.py +0 -0
  132. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_quantization/lifecycle/test_initialize.py +0 -0
  133. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_quantization/lifecycle/test_lifecycle.py +0 -0
  134. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_quantization/lifecycle/test_static_lifecycle.py +0 -0
  135. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_quantization/test_configs/__init__.py +0 -0
  136. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_quantization/test_configs/test_bit_depths.py +0 -0
  137. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_quantization/test_configs/test_strategies.py +0 -0
  138. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_quantization/test_quant_args.py +0 -0
  139. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_quantization/test_quant_config.py +0 -0
  140. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_quantization/test_quant_scheme.py +0 -0
  141. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_quantization/test_utils/test_helpers.py +0 -0
  142. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_quantization/test_utils/test_mxfp4_utils.py +0 -0
  143. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_registry.py +0 -0
  144. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_transform/conftest.py +0 -0
  145. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_transform/factory/test_correctness.py +0 -0
  146. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_transform/factory/test_memory.py +0 -0
  147. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_transform/factory/test_serialization.py +0 -0
  148. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_transform/test_transform_args.py +0 -0
  149. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_transform/test_transform_config.py +0 -0
  150. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_transform/test_transform_scheme.py +0 -0
  151. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_transform/utils/test_hadamard.py +0 -0
  152. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_utils/__init__.py +0 -0
  153. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_utils/test_helpers.py +0 -0
  154. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_utils/test_offload.py +0 -0
  155. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_utils/test_safetensors_load.py +0 -0
  156. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/test_utils/test_type.py +0 -0
  157. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/tests/testing_utils.py +0 -0
  158. {compressed_tensors-0.12.3a20251114 → compressed_tensors-0.12.3a20251203}/utils/copyright.py +0 -0

PKG-INFO

@@ -1,6 +1,6 @@
  Metadata-Version: 2.4
  Name: compressed-tensors
- Version: 0.12.3a20251114
+ Version: 0.12.3a20251203
  Summary: Library for utilization of compressed safetensors of neural network models
  Home-page: https://github.com/vllm-project/compressed-tensors
  Author: Neuralmagic, Inc.

src/compressed_tensors/utils/match.py

@@ -13,7 +13,9 @@
  # limitations under the License.

  import logging
+ import os
  import re
+ from collections import defaultdict
  from collections.abc import Generator
  from typing import Iterable, List, Mapping, Optional, Tuple, Union


@@ -29,6 +31,7 @@ __all__ = [
      "match_named_parameters",
      "match_targets",
      "match_modules_set",
+     "get_lowest_common_ancestor_name",
      "is_match",
      "is_narrow_match",
  ]

@@ -157,34 +160,68 @@ def match_targets(
      return matched_targets


+ def get_lowest_common_ancestor_name(names: list[str | None]) -> str:
+     """
+     Given a list of names, returns the lowest-scope common name ignoring Nones.
+
+     Implementation is a small alteration of os.path.commonprefix
+     https://docs.python.org/3/library/os.path.html#os.path.commonprefix
+
+     ([s1, s2]->prefix->result)
+     # case 0: multiple modules: [abc.a., abc.b.] -> .abc. -> abc
+     # case 1: single module: [abc.] -> .abc. -> abc
+     # case 2: substring modules: [abc., ab.] -> .ab -> ""
+     # case 3: parent & child: [ab., ab.a.] -> .ab. -> ab
+     """
+     names = [name for name in names if name is not None]
+     if len(names) == 0:
+         return ""
+
+     # 1) find longest shared prefix
+     s1 = "." + min(names) + "."
+     s2 = "." + max(names) + "."
+     common_prefix = os.path.commonprefix([s1, s2])
+     # 2) throw away right most dot and name fragment, throw away leftmost char
+     # ".keep.thro" -> "keep", "." -> ""
+     return common_prefix[1 : common_prefix.rfind(".")]
+
+
  def match_modules_set(
      model: torch.nn.Module,
      targets: Optional[Iterable[str]],
      ignore: Optional[Iterable[str]] = None,
- ) -> Generator[Iterable[torch.nn.Module]]:
+     error_on_module_rematch: bool = True,
+ ) -> Generator[List[List[torch.nn.Module]]]:
      """
-     Yields modules grouped with the same order and size as `targets`.
-     Values are returned in order of `model.named_modules()`
+     Yields modules grouped by parent context.
+
+     We group by parent context so that we can return ALL matches of a
+     specific target that can be paired with another target. This is most
+     relevant in the case of MoE modules with multiple modules for each
+     expert i.e. post_attention_layernorm <-> mlp.expert.N.gate_proj,
+     mlp.expert.N.up_proj for all N. The parent context will differ from
+     one layer to another while being the same for one expert to another.

-     E.g. the following targets would yield module belonging to the following layers:
+     Each returned group is a list (of lists) with the same size
+     and order as `targets` while all matches for each target and
+     the overall order of the groups are ordered in the same way
+     as `model.named_modules`
+
+
+     E.g. the following targets would yield modules belonging to the following layers:
      ```python3
      match_modules_set(model, ["q_proj", "k_proj", "v_proj"]) == (
-         (
-             `model.layers.0.self_attn.q_proj`,
-             `model.layers.0.self_attn.k_proj`,
-             `model.layers.0.self_attn.v_proj`,
-         ),
-         (
-             `model.layers.1.self_attn.q_proj`,
-             `model.layers.1.self_attn.k_proj`,
-             `model.layers.1.self_attn.v_proj`,
-         ),
+         [
+             [`layers.0.self_attn.q_proj`],
+             [`layers.0.self_attn.k_proj`],
+             [`layers.0.self_attn.v_proj`],
+         ],
+         [
+             [`layers.1.self_attn.q_proj`],
+             [`layers.1.self_attn.k_proj`],
+             [`layers.1.self_attn.v_proj`],
+         ],
          ...
-         (
-             `model.layers.32.self_attn.q_proj`,
-             `model.layers.32.self_attn.k_proj`,
-             `model.layers.32.self_attn.v_proj`,
-         ),
      )
      ```

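As a quick aid to reading the hunk above, here is a minimal sketch of how the new helper behaves. The module names are invented for illustration, and the assertions simply restate the docstring cases; the import relies on the export added to `__all__` in the previous hunk.

```python
# Sketch only: illustrative names, mirroring the docstring cases above.
from compressed_tensors.utils import get_lowest_common_ancestor_name

# sibling modules share their parent scope
assert get_lowest_common_ancestor_name(
    ["layers.0.mlp.gate_proj", "layers.0.mlp.up_proj"]
) == "layers.0.mlp"

# a single name is its own ancestor; Nones are ignored
assert get_lowest_common_ancestor_name(["layers.0.mlp", None]) == "layers.0.mlp"

# names that only share the root resolve to the empty string
assert get_lowest_common_ancestor_name(["layers.0.mlp", "embed_tokens"]) == ""
```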

@@ -192,33 +229,125 @@ def match_modules_set(
      For example, matching layer norms to their subsequent linear layers
      ```python3
      for norm, q, k, v in match_modules_set(model, (norm_tgt, q_tgt, k_tgt, v_tgt)):
-         fuse_norm_linears(norm, [q, k, v])
+         fuse_norm_linears(*norm, [*q, *k, *v])
+     ```
+
+     Alternatively for MoE you would get multiple matches
+     per target per group, E.g.
+
+     ```python3
+
+     targets = [
+         "post_attention_layernorm",
+         "up_proj",
+         "down_proj"
+     ]
+     match_modules_set(model, targets) == (
+         [
+             [layers.0.post_attention_layernorm],
+             [
+                 `layers.0.mlp.experts.0.up_proj`,
+                 `layers.0.mlp.experts.1.up_proj`,
+                 ...
+             ],
+             [
+                 `layers.0.mlp.experts.0.down_proj`,
+                 `layers.0.mlp.experts.1.down_proj`,
+                 ...
+
+             ]
+         ], # <- first yield
+         [
+             [layers.1.post_attention_layernorm],
+             [
+                 `layers.1.mlp.experts.0.up_proj`,
+                 `layers.1.mlp.experts.1.up_proj`,
+                 ...
+             ],
+             [
+                 `layers.1.mlp.experts.0.down_proj`,
+                 `layers.1.mlp.experts.1.down_proj`,
+                 ...
+             ]
+         ],
+         ...
+     )
+     ```

      :param model: model containing modules to match against
      :param targets: target strings, potentially containing "re:" prefixes
      :param ignore: targets to ignore, potentially containing "re:" prefixes
+     :param error_on_module_rematch: if True, errors when a module gets
+         matched to multiple targets, if False, no error. (Defaults to True)
      """
      targets = targets or []
      ignore = ignore or []

-     matches = dict.fromkeys(targets, None)
+     # as we iterate through modules and try to match them with targets,
+     # the algorithm can be in 2 possible states:
+     # 0) unmatched_targets > 0, i.e. some of the targets haven't been matched.
+     #    Keep matching until all targets have at least one match
+     # 1) unmatched_targets == 0 i.e. we have at least one match for each target.
+     #    At this point we are unsure if we have a full set or if we need to add
+     #    more matches.
+     # There are 3 things that can happen once were in state 1:
+     # A) found a new match with same parent_context,
+     #    (add it to matches and keep going)
+     # B) found a new match with different parent_context, i.e. we found a match
+     #    that requires a deeper parent context, this indicates that this match
+     #    should be part of a new set.
+     #    (yield current set [not including newest match] and go back to state 0)
+     # C) ran out of modules, we will always yield the final remaining set when
+     #    we we've iterated through all the modules in the model.
+     #    (yield final set then exit.)
+     # Note: its possible to iterate through all the modules in the model while
+     # not having a full matched set if the user specified a bad matching, in
+     # that case something has gone wrong and we error
+     matches = defaultdict(list)
+     parent_context = None
+     unmatched_targets = set(targets)
+
      for name, module in model.named_modules():
-         # match until we get a full set
+         matched_targets_for_cur_module = set()
          for target in targets:
              if is_match(name, module, target, ignore):
-                 if matches[target] is not None:
-                     raise ValueError(f"Matched a {target} twice before completing set")
-                 matches[target] = module
-
-         # once we have a full set, yield and reset
-         if targets and all((matches[target] is not None for target in targets)):
-             yield [matches[target] for target in targets]  # ensure correct ordering
-             matches = dict.fromkeys(targets, None)
-
-     # check that none are left over
-     unmatched_keys = [match for match, value in matches.items() if value is not None]
-     if len(unmatched_keys):
-         raise ValueError(f"Unable to match targets into set: {unmatched_keys}")
+                 new_parent_context = get_lowest_common_ancestor_name(
+                     [name, parent_context]
+                 )
+
+                 # code for (B)
+                 if not unmatched_targets and new_parent_context != parent_context:
+                     yield [matches[target] for target in targets]
+                     matches = defaultdict(list)
+                     new_parent_context = name
+                     unmatched_targets = set(targets)
+
+                 matches[target].append(module)
+                 parent_context = new_parent_context
+                 unmatched_targets -= {target}
+                 matched_targets_for_cur_module |= {target}
+
+         if len(matched_targets_for_cur_module) > 1 and error_on_module_rematch:
+             raise ValueError(
+                 f"module: {name} was matched with multiple targets: "
+                 f"{matched_targets_for_cur_module} which is unexpected "
+                 "disable this check by setting `error_on_module_rematch = False`"
+             )
+
+     # never found anything
+     if unmatched_targets == set(targets):
+         return
+
+     # code for (C)
+     if not unmatched_targets:  # have a full matching
+         yield [matches[target] for target in targets]
+         return
+
+     raise ValueError(
+         f"Found a final incomplete set with matches found for keys: "
+         f"{set(targets) - unmatched_targets} "
+         f"but no matches found for keys: {unmatched_targets}"
+     )


  def is_match(
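Because the yield type changes from one module per target to a list of modules per target, existing callers need a small adjustment. Below is a hedged sketch of consuming the new API on a toy module tree; the layer names and sizes are invented for the example, and the behaviour shown (a single group containing both experts once a layer-level target widens the parent context) follows the grouping described in the docstring above.

```python
import torch.nn as nn
from compressed_tensors.utils import match_modules_set

# Toy single-block "MoE" tree; names are illustrative only.
model = nn.ModuleDict(
    {
        "post_attention_layernorm": nn.LayerNorm(4),
        "experts": nn.ModuleList(
            [
                nn.ModuleDict(
                    {"up_proj": nn.Linear(4, 8), "down_proj": nn.Linear(8, 4)}
                )
                for _ in range(2)
            ]
        ),
    }
)

targets = ["post_attention_layernorm", "re:.*up_proj$", "re:.*down_proj$"]
for norms, ups, downs in match_modules_set(model, targets):
    # each yielded group is one list per target, in target order
    assert len(norms) == 1                 # the single layernorm
    assert len(ups) == len(downs) == 2     # both experts grouped together

# A module that matches several targets now raises unless the new flag is cleared:
# match_modules_set(model, targets, error_on_module_rematch=False)
```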

src/compressed_tensors/version.py

@@ -17,5 +17,5 @@ __version__: str
  __version_tuple__: VERSION_TUPLE
  version_tuple: VERSION_TUPLE

- __version__ = version = '0.12.3.a20251114'
+ __version__ = version = '0.12.3.a20251203'
  __version_tuple__ = version_tuple = (0, 12, 3)

src/compressed_tensors.egg-info/PKG-INFO

@@ -1,6 +1,6 @@
  Metadata-Version: 2.4
  Name: compressed-tensors
- Version: 0.12.3a20251114
+ Version: 0.12.3a20251203
  Summary: Library for utilization of compressed safetensors of neural network models
  Home-page: https://github.com/vllm-project/compressed-tensors
  Author: Neuralmagic, Inc.

tests/test_utils/test_match.py

@@ -20,6 +20,7 @@ import torch.nn as nn
  # Assuming the module is named "module_matching" - adjust import as needed
  from compressed_tensors.utils import (
      InternalModule,
+     get_lowest_common_ancestor_name,
      is_match,
      is_narrow_match,
      match_modules_set,

@@ -79,6 +80,39 @@ class DummyModel(nn.Module):
          )


+ class DummyMoEModel(nn.Module):
+     """Test MoE model for unit tests. Weights are initialized on meta device"""
+
+     def __init__(self, num_layers=2, num_experts=4):
+         super().__init__()
+         self.layers = nn.ModuleList(
+             [
+                 nn.ModuleDict(
+                     {
+                         "post_attention_layernorm": nn.LayerNorm(3),
+                         "mlp": nn.ModuleDict(
+                             {
+                                 "experts": nn.ModuleList(
+                                     [
+                                         nn.ModuleDict(
+                                             {
+                                                 "gate_proj": nn.Linear(3, 6),
+                                                 "up_proj": nn.Linear(3, 6),
+                                                 "down_proj": nn.Linear(6, 3),
+                                             }
+                                         )
+                                         for _ in range(num_experts)
+                                     ]
+                                 ),
+                             }
+                         ),
+                     }
+                 )
+                 for _ in range(num_layers)
+             ]
+         )
+
+
  class TestMatchName:
      """Test cases for _match_name function"""

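For orientation, the qualified names this fixture registers follow directly from the ModuleList/ModuleDict nesting above, and they are what the parent-context grouping in match_modules_set keys on. The short sketch below only enumerates them; it reuses the DummyMoEModel fixture defined in the hunk above.

```python
import torch.nn as nn

# Sketch: list the leaf module names produced by the fixture above.
model = DummyMoEModel(num_layers=2, num_experts=4)
for name, module in model.named_modules():
    if isinstance(module, (nn.Linear, nn.LayerNorm)):
        print(name)
# layers.0.post_attention_layernorm
# layers.0.mlp.experts.0.gate_proj
# layers.0.mlp.experts.0.up_proj
# layers.0.mlp.experts.0.down_proj
# layers.0.mlp.experts.1.gate_proj
# ...
# layers.1.post_attention_layernorm
# ...
```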

@@ -412,6 +446,58 @@ class TestMatchNamedParameters:
          assert len(matches) == 0


+ class TestGetLowestCommonModuleName:
+     """Test cases for get_lowest_common_ancestor_name function"""
+
+     def test_multiple_modules(self):
+         assert "abc" == get_lowest_common_ancestor_name(
+             [
+                 "abc.a",
+                 "abc.b",
+                 "abc.c",
+             ]
+         )
+
+     def test_single_module(self):
+         assert "abc.abc" == get_lowest_common_ancestor_name(
+             [
+                 "abc.abc",
+             ]
+         )
+
+     def test_substring_modules(self):
+         assert "abc" == get_lowest_common_ancestor_name(
+             [
+                 "abc.abc",
+                 "abc.ab",
+             ]
+         )
+
+     def test_parent_and_child_modules(self):
+         assert "abc.abc" == get_lowest_common_ancestor_name(
+             [
+                 "abc.abc.ab",
+                 "abc.abc",
+             ]
+         )
+
+     def test_root(self):
+         assert "" == get_lowest_common_ancestor_name(
+             [
+                 "abc.abc",
+                 "b.abc",
+             ]
+         )
+
+     def test_ignore_none(self):
+         assert "abc.abc" == get_lowest_common_ancestor_name(
+             [
+                 "abc.abc",
+                 None,
+             ]
+         )
+
+
  class TestMatchModulesSet:
      """Test cases for match_modules_set function"""


@@ -432,7 +518,71 @@ class TestMatchModulesSet:
          # Each set should have 3 modules
          for module_set in matches:
              assert len(module_set) == 3
-             assert all(isinstance(m, nn.Linear) for m in module_set)
+             assert all(isinstance(*m, nn.Linear) for m in module_set)
+
+     def test_moe_module_match(self):
+         """Test matching MoE modules with multiple experts per layer"""
+         model = DummyMoEModel(num_layers=2, num_experts=4)
+
+         # Test matching expert projections - each expert becomes its own set
+         # because the parent context differs between experts
+         targets = [
+             "re:.*gate_proj$",
+             "re:.*up_proj$",
+         ]
+
+         matches = list(match_modules_set(model, targets))
+
+         # Should have 8 sets (2 layers * 4 experts)
+         assert len(matches) == 8
+
+         # Each set should have 2 target lists (gate_proj, up_proj)
+         for expert_group in matches:
+             assert len(expert_group) == 2
+             gate_modules, up_modules = expert_group
+
+             # Each target should have matched 1 module (single expert)
+             assert len(gate_modules) == 1
+             assert len(up_modules) == 1
+
+             # All modules should be Linear layers
+             assert isinstance(gate_modules[0], nn.Linear)
+             assert isinstance(up_modules[0], nn.Linear)
+
+     def test_moe_with_layernorm_match(self):
+         """
+         Test matching MoE modules with their corresponding layer norms.
+         Including a layer-level module (layernorm) groups all experts in
+         that layer together.
+         """
+         model = DummyMoEModel(num_layers=2, num_experts=3)
+
+         # Match layer norm with expert projections - the layernorm is at layer level,
+         # so it establishes a common parent context for all experts in that layer
+         targets = [
+             "re:.*post_attention_layernorm$",
+             "re:.*gate_proj$",
+             "re:.*up_proj$",
+         ]
+
+         matches = list(match_modules_set(model, targets))
+
+         # Should have 2 layer groups (one per layer)
+         assert len(matches) == 2
+
+         for layer_group in matches:
+             assert len(layer_group) == 3
+             norm_modules, gate_modules, up_modules = layer_group
+
+             # LayerNorm should have 1 module (single per layer)
+             assert len(norm_modules) == 1
+             assert isinstance(norm_modules[0], nn.LayerNorm)
+
+             # Each projection should have 3 experts (all experts in the layer)
+             assert len(gate_modules) == 3
+             assert len(up_modules) == 3
+             assert all(isinstance(m, nn.Linear) for m in gate_modules)
+             assert all(isinstance(m, nn.Linear) for m in up_modules)

      def test_module_set_ordering(self):
          """Test that module sets maintain target ordering"""

@@ -448,6 +598,7 @@ class TestMatchModulesSet:
          for module_set in matches:
              # Check that modules are returned in target order (v, q, k)
              v_proj, q_proj, k_proj = module_set
+             v_proj, q_proj, k_proj = *v_proj, *q_proj, *k_proj
              # We can't easily check the exact modules, but can check they're all Linear
              assert all(isinstance(m, nn.Linear) for m in [v_proj, q_proj, k_proj])


@@ -456,18 +607,8 @@ class TestMatchModulesSet:
          model = DummyModel()
          targets = ["layer1", "nonexistent_module"]

-         with pytest.raises(ValueError, match="Unable to match targets into set"):
-             list(match_modules_set(model, targets))
-
-     def test_duplicate_match_error(self):
-         """Test error when same target matches multiple times before set completion"""
-         model = DummyModel()
-         # This should cause the same target to match multiple times
-         # before we can complete a set
-         targets = ["Linear", "Linear"]  # Two identical targets
-
          with pytest.raises(
-             ValueError, match="Matched a .* twice before completing set"
+             ValueError, match="Found a final incomplete set with matches found for keys"
          ):
              list(match_modules_set(model, targets))