compressed-tensors 0.10.2a20250606__py3-none-any.whl → 0.10.2a20250609__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- compressed_tensors/compressors/model_compressors/model_compressor.py +7 -1
- compressed_tensors/compressors/sparse_compressors/base.py +19 -1
- compressed_tensors/utils/offload.py +3 -0
- compressed_tensors/version.py +1 -1
- {compressed_tensors-0.10.2a20250606.dist-info → compressed_tensors-0.10.2a20250609.dist-info}/METADATA +1 -1
- {compressed_tensors-0.10.2a20250606.dist-info → compressed_tensors-0.10.2a20250609.dist-info}/RECORD +9 -9
- {compressed_tensors-0.10.2a20250606.dist-info → compressed_tensors-0.10.2a20250609.dist-info}/WHEEL +0 -0
- {compressed_tensors-0.10.2a20250606.dist-info → compressed_tensors-0.10.2a20250609.dist-info}/licenses/LICENSE +0 -0
- {compressed_tensors-0.10.2a20250606.dist-info → compressed_tensors-0.10.2a20250609.dist-info}/top_level.txt +0 -0
@@ -68,6 +68,10 @@ from transformers import AutoConfig
|
|
68
68
|
from transformers.file_utils import CONFIG_NAME
|
69
69
|
|
70
70
|
|
71
|
+
if TYPE_CHECKING:
|
72
|
+
from compressed_tensors.compressors import BaseQuantizationCompressor
|
73
|
+
|
74
|
+
|
71
75
|
__all__ = ["ModelCompressor", "map_module_to_scheme"]
|
72
76
|
|
73
77
|
_LOGGER: logging.Logger = logging.getLogger(__name__)
|
@@ -257,7 +261,9 @@ class ModelCompressor:
|
|
257
261
|
self.sparsity_config = sparsity_config
|
258
262
|
self.quantization_config = quantization_config
|
259
263
|
self.sparsity_compressor = None
|
260
|
-
self.quantization_compressor = None
|
264
|
+
self.quantization_compressor: Optional[
|
265
|
+
Union[BaseQuantizationCompressor, DenseCompressor]
|
266
|
+
] = None
|
261
267
|
|
262
268
|
if sparsity_config is not None:
|
263
269
|
self.sparsity_compressor = BaseCompressor.load_from_registry(
|
@@ -13,8 +13,9 @@
|
|
13
13
|
# limitations under the License.
|
14
14
|
|
15
15
|
import logging
|
16
|
-
from typing import Dict, Generator, Optional, Set, Tuple
|
16
|
+
from typing import TYPE_CHECKING, Dict, Generator, Optional, Set, Tuple
|
17
17
|
|
18
|
+
import torch
|
18
19
|
from compressed_tensors.compressors.base import BaseCompressor
|
19
20
|
from compressed_tensors.utils import (
|
20
21
|
get_nested_mappings_from_state_dict,
|
@@ -26,6 +27,10 @@ from torch import Tensor
|
|
26
27
|
from tqdm import tqdm
|
27
28
|
|
28
29
|
|
30
|
+
if TYPE_CHECKING:
|
31
|
+
from compressed_tensors.quantization import QuantizationScheme
|
32
|
+
|
33
|
+
|
29
34
|
__all__ = ["BaseSparseCompressor"]
|
30
35
|
|
31
36
|
_LOGGER: logging.Logger = logging.getLogger(__name__)
|
@@ -200,3 +205,16 @@ class BaseSparseCompressor(BaseCompressor):
|
|
200
205
|
return (
|
201
206
|
name.endswith(".weight") and name[: -(len(".weight"))] in expanded_targets
|
202
207
|
)
|
208
|
+
|
209
|
+
def decompress_module_from_state_dict(
|
210
|
+
self,
|
211
|
+
prefix: str,
|
212
|
+
state_dict: Dict[str, torch.Tensor],
|
213
|
+
scheme: "QuantizationScheme",
|
214
|
+
) -> Dict[str, torch.Tensor]:
|
215
|
+
"""
|
216
|
+
This function is implemented as a workaround because of how
|
217
|
+
`ModelCompressor.quantization_compressor` can be set to either
|
218
|
+
an instance of `BaseQuantizationCompressor` or `BaseSparseCompressor`.
|
219
|
+
"""
|
220
|
+
return state_dict.copy()
|
@@ -87,12 +87,15 @@ def check_accelerate(fallback: Any):
|
|
87
87
|
if not _has_accelerate:
|
88
88
|
|
89
89
|
if fallback == "error":
|
90
|
+
|
90
91
|
@wraps(func)
|
91
92
|
def fallback_fn(*args, **kwargs):
|
92
93
|
raise ValueError(
|
93
94
|
"Please install `accelerate` in order to use this function"
|
94
95
|
)
|
96
|
+
|
95
97
|
else:
|
98
|
+
|
96
99
|
@wraps(func)
|
97
100
|
def fallback_fn(*args, **kwargs):
|
98
101
|
return fallback
|
compressed_tensors/version.py
CHANGED
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.4
|
2
2
|
Name: compressed-tensors
|
3
|
-
Version: 0.10.2a20250606
|
3
|
+
Version: 0.10.2a20250609
|
4
4
|
Summary: Library for utilization of compressed safetensors of neural network models
|
5
5
|
Home-page: https://github.com/neuralmagic/compressed-tensors
|
6
6
|
Author: Neuralmagic, Inc.
|
{compressed_tensors-0.10.2a20250606.dist-info → compressed_tensors-0.10.2a20250609.dist-info}/RECORD
RENAMED
@@ -1,18 +1,18 @@
|
|
1
1
|
compressed_tensors/__init__.py,sha256=UtKmifNeBCSE2TZSAfduVNNzHY-3V7bLjZ7n7RuXLOE,812
|
2
2
|
compressed_tensors/base.py,sha256=73HYH7HY7O2roC89yG_piPFnZwrBfn_i7HmKl90SKc0,875
|
3
|
-
compressed_tensors/version.py,sha256=
|
3
|
+
compressed_tensors/version.py,sha256=LTla_Pj0LNUtkAT7ETF33M0rqtov9c8Q6T5tjzwvHOs,523
|
4
4
|
compressed_tensors/compressors/__init__.py,sha256=smSygTSfcfuujRrAXDc6uZm4L_ccV1tWZewqVnOb4lM,825
|
5
5
|
compressed_tensors/compressors/base.py,sha256=nvWsv4xEw1Tkxkxth6TmHplDYXfBeP22xWxOsZERyDY,7204
|
6
6
|
compressed_tensors/compressors/helpers.py,sha256=OK6qxX9j3bHwF9JfIYSGMgBJe2PWjlTA3byXKCJaTIQ,5431
|
7
7
|
compressed_tensors/compressors/model_compressors/__init__.py,sha256=5RGGPFu4YqEt_aOdFSQYFYFDjcZFJN0CsMqRtDZz3Js,666
|
8
|
-
compressed_tensors/compressors/model_compressors/model_compressor.py,sha256=
|
8
|
+
compressed_tensors/compressors/model_compressors/model_compressor.py,sha256=nt0KxhZakDdlTIebBYcSvqxLCZhA6p6IL_1AYiHLFug,32695
|
9
9
|
compressed_tensors/compressors/quantized_compressors/__init__.py,sha256=KvaFBL_Q84LxRGJOV035M8OBoCkAx8kOkfphswgkKWk,745
|
10
10
|
compressed_tensors/compressors/quantized_compressors/base.py,sha256=ByE3z61boZ5wdz0nhc-2CJH61bSixJQE78pfkS6XRDg,10269
|
11
11
|
compressed_tensors/compressors/quantized_compressors/naive_quantized.py,sha256=0ANDcuD8aXPqTYNPY6GnX9iS6eXJw6P0TzNV_rYS2l8,5369
|
12
12
|
compressed_tensors/compressors/quantized_compressors/nvfp4_quantized.py,sha256=Gw-lVzk5jrKUlM5UTCiJBmhM5gHzB9mn8r298MVUbDI,6395
|
13
13
|
compressed_tensors/compressors/quantized_compressors/pack_quantized.py,sha256=_66tQ8bxslDUdas-ULORXblPw9kdNNn1UJJU9-ZOGPY,11380
|
14
14
|
compressed_tensors/compressors/sparse_compressors/__init__.py,sha256=Atuz-OdEgn8OCUhx7Ovd6gXdyImAI186uCR-uR0t_Nk,737
|
15
|
-
compressed_tensors/compressors/sparse_compressors/base.py,sha256=
|
15
|
+
compressed_tensors/compressors/sparse_compressors/base.py,sha256=4-7Hm2uJ4qYtl4hi6GqwegGg2gYNhbq7noledK3h86Q,8684
|
16
16
|
compressed_tensors/compressors/sparse_compressors/dense.py,sha256=rPaxbP7P52prWNs4lGaiBbpNvsQLElFMwOrq1oBP2Yg,1733
|
17
17
|
compressed_tensors/compressors/sparse_compressors/sparse_24_bitmask.py,sha256=4cwkj40SFrXEyE_jyt2xjz3R-gTdU9uMpMFUKo1pRBA,8643
|
18
18
|
compressed_tensors/compressors/sparse_compressors/sparse_bitmask.py,sha256=S8vW0FI9ep_XtUQOxj0P5utJt3vKEYOHjWEPp-Xd9aY,5820
|
@@ -48,13 +48,13 @@ compressed_tensors/transform/utils/hadamard.py,sha256=SmPZmnHtc5N36gJA5EbM1T65uf
|
|
48
48
|
compressed_tensors/transform/utils/utils.py,sha256=PRPTYwPs2nnNaQMq2GEbC4QYKHFKlZwaRyPgdDhl66g,2992
|
49
49
|
compressed_tensors/utils/__init__.py,sha256=gS4gSU2pwcAbsKj-6YMaqhm25udFy6ISYaWBf-myRSM,808
|
50
50
|
compressed_tensors/utils/helpers.py,sha256=cPg-ikdeA92aIGwBONg8GmPNvcGlFhozyJVwsRiXBTA,11981
|
51
|
-
compressed_tensors/utils/offload.py,sha256=
|
51
|
+
compressed_tensors/utils/offload.py,sha256=aGcBv0UWLuauY_-HBSei5Gm0xsZOfWn7NeX76tcLf30,20319
|
52
52
|
compressed_tensors/utils/permutations_24.py,sha256=kx6fsfDHebx94zsSzhXGyCyuC9sVyah6BUUir_StT28,2530
|
53
53
|
compressed_tensors/utils/permute.py,sha256=V6tJLKo3Syccj-viv4F7ZKZgJeCB-hl-dK8RKI_kBwI,2355
|
54
54
|
compressed_tensors/utils/safetensors_load.py,sha256=DMfZBuUbA6qp_BG_zIWT3ckiEE33K9ob34s-OgzReO4,12057
|
55
55
|
compressed_tensors/utils/semi_structured_conversions.py,sha256=XKNffPum54kPASgqKzgKvyeqWPAkair2XEQXjkp7ho8,13489
|
56
|
-
compressed_tensors-0.10.2a20250606.dist-info/licenses/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
|
57
|
-
compressed_tensors-0.10.2a20250606.dist-info/METADATA,sha256=
|
58
|
-
compressed_tensors-0.10.2a20250606.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
59
|
-
compressed_tensors-0.10.2a20250606.dist-info/top_level.txt,sha256=w2i-GyPs2s1UwVxvutSvN_lM22SXC2hQFBmoMcPnV7Y,19
|
60
|
-
compressed_tensors-0.10.2a20250606.dist-info/RECORD,,
|
56
|
+
compressed_tensors-0.10.2a20250609.dist-info/licenses/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
|
57
|
+
compressed_tensors-0.10.2a20250609.dist-info/METADATA,sha256=_OH8bysJ6ymrDyfkHXrKuZNb47qh38hfdCCOt7RRYeM,7005
|
58
|
+
compressed_tensors-0.10.2a20250609.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
59
|
+
compressed_tensors-0.10.2a20250609.dist-info/top_level.txt,sha256=w2i-GyPs2s1UwVxvutSvN_lM22SXC2hQFBmoMcPnV7Y,19
|
60
|
+
compressed_tensors-0.10.2a20250609.dist-info/RECORD,,
|
{compressed_tensors-0.10.2a20250606.dist-info → compressed_tensors-0.10.2a20250609.dist-info}/WHEEL
RENAMED
File without changes
|
File without changes
|
File without changes
|