compressed-tensors 0.10.3a20250709__py3-none-any.whl → 0.10.3a20250710__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- compressed_tensors/compressors/model_compressors/model_compressor.py +2 -2
- compressed_tensors/compressors/sparse_compressors/sparse_24_bitmask.py +6 -2
- compressed_tensors/version.py +1 -1
- {compressed_tensors-0.10.3a20250709.dist-info → compressed_tensors-0.10.3a20250710.dist-info}/METADATA +1 -1
- {compressed_tensors-0.10.3a20250709.dist-info → compressed_tensors-0.10.3a20250710.dist-info}/RECORD +8 -8
- {compressed_tensors-0.10.3a20250709.dist-info → compressed_tensors-0.10.3a20250710.dist-info}/WHEEL +0 -0
- {compressed_tensors-0.10.3a20250709.dist-info → compressed_tensors-0.10.3a20250710.dist-info}/licenses/LICENSE +0 -0
- {compressed_tensors-0.10.3a20250709.dist-info → compressed_tensors-0.10.3a20250710.dist-info}/top_level.txt +0 -0
@@ -392,8 +392,8 @@ class ModelCompressor:
|
|
392
392
|
for prefix, module in tqdm(model.named_modules(), desc="Compressing model"):
|
393
393
|
|
394
394
|
if prefix in module_to_scheme or prefix in sparse_compression_targets:
|
395
|
-
module_device = get_execution_device(module)
|
396
|
-
is_meta =
|
395
|
+
module_device = get_execution_device(module)
|
396
|
+
is_meta = module_device.type == "meta"
|
397
397
|
|
398
398
|
exec_device = "meta" if is_meta else "cpu"
|
399
399
|
onloading_device = "meta" if is_meta else module_device
|
@@ -178,9 +178,13 @@ def sparse24_bitmask_compress(
|
|
178
178
|
|
179
179
|
if tensor.is_meta:
|
180
180
|
num_rows, num_cols = tensor.shape
|
181
|
-
compressed_values = torch.empty(
|
181
|
+
compressed_values = torch.empty(
|
182
|
+
(num_rows, num_cols // 2), dtype=tensor.dtype, device="meta"
|
183
|
+
)
|
182
184
|
packed_cols = (num_cols + 7) // 8
|
183
|
-
bitmasks_packed = torch.empty(
|
185
|
+
bitmasks_packed = torch.empty(
|
186
|
+
(num_rows, packed_cols), dtype=torch.uint8, device="meta"
|
187
|
+
)
|
184
188
|
return compressed_values, bitmasks_packed
|
185
189
|
|
186
190
|
bytemasks = get_24_bytemasks(tensor=tensor)
|
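compressed_tensors/version.py
CHANGED
{compressed_tensors-0.10.3a20250709.dist-info → compressed_tensors-0.10.3a20250710.dist-info}/METADATA
RENAMED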
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.4
|
2
2
|
Name: compressed-tensors
|
3
|
-
Version: 0.10.3a20250709
|
3
|
+
Version: 0.10.3a20250710
|
4
4
|
Summary: Library for utilization of compressed safetensors of neural network models
|
5
5
|
Home-page: https://github.com/neuralmagic/compressed-tensors
|
6
6
|
Author: Neuralmagic, Inc.
|
{compressed_tensors-0.10.3a20250709.dist-info → compressed_tensors-0.10.3a20250710.dist-info}/RECORD
RENAMED
@@ -1,11 +1,11 @@
|
|
1
1
|
compressed_tensors/__init__.py,sha256=UtKmifNeBCSE2TZSAfduVNNzHY-3V7bLjZ7n7RuXLOE,812
|
2
2
|
compressed_tensors/base.py,sha256=73HYH7HY7O2roC89yG_piPFnZwrBfn_i7HmKl90SKc0,875
|
3
|
-
compressed_tensors/version.py,sha256=
|
3
|
+
compressed_tensors/version.py,sha256=gqWN6LSE0C4r0hiPn2KpmE4YPwpZnktZcE8p9BTZksQ,523
|
4
4
|
compressed_tensors/compressors/__init__.py,sha256=smSygTSfcfuujRrAXDc6uZm4L_ccV1tWZewqVnOb4lM,825
|
5
5
|
compressed_tensors/compressors/base.py,sha256=nvWsv4xEw1Tkxkxth6TmHplDYXfBeP22xWxOsZERyDY,7204
|
6
6
|
compressed_tensors/compressors/helpers.py,sha256=OK6qxX9j3bHwF9JfIYSGMgBJe2PWjlTA3byXKCJaTIQ,5431
|
7
7
|
compressed_tensors/compressors/model_compressors/__init__.py,sha256=5RGGPFu4YqEt_aOdFSQYFYFDjcZFJN0CsMqRtDZz3Js,666
|
8
|
-
compressed_tensors/compressors/model_compressors/model_compressor.py,sha256=
|
8
|
+
compressed_tensors/compressors/model_compressors/model_compressor.py,sha256=Zl33ceJu_KH_Vx2B5EK-bvE7W5OklOL0hb-QqdOVSsE,32906
|
9
9
|
compressed_tensors/compressors/quantized_compressors/__init__.py,sha256=KvaFBL_Q84LxRGJOV035M8OBoCkAx8kOkfphswgkKWk,745
|
10
10
|
compressed_tensors/compressors/quantized_compressors/base.py,sha256=YGUMzbxekj_36ChgQnVZN6T8uDjXtGG1zfMIBGBLWco,10354
|
11
11
|
compressed_tensors/compressors/quantized_compressors/naive_quantized.py,sha256=0ANDcuD8aXPqTYNPY6GnX9iS6eXJw6P0TzNV_rYS2l8,5369
|
@@ -14,7 +14,7 @@ compressed_tensors/compressors/quantized_compressors/pack_quantized.py,sha256=47
|
|
14
14
|
compressed_tensors/compressors/sparse_compressors/__init__.py,sha256=Atuz-OdEgn8OCUhx7Ovd6gXdyImAI186uCR-uR0t_Nk,737
|
15
15
|
compressed_tensors/compressors/sparse_compressors/base.py,sha256=YNZWcHjDleAlqbgRZQ6oJf44MQb_UDNvJGOqhl26uFA,8098
|
16
16
|
compressed_tensors/compressors/sparse_compressors/dense.py,sha256=-OujJ1e0iXBvxYVULrIGvAZ9l-IC0mXczZRnimQdgo4,2314
|
17
|
-
compressed_tensors/compressors/sparse_compressors/sparse_24_bitmask.py,sha256=
|
17
|
+
compressed_tensors/compressors/sparse_compressors/sparse_24_bitmask.py,sha256=p8cNV-W4TZKaWDlCwjptQyaIrwqlHizZ1Pn4Vx3-ANk,9262
|
18
18
|
compressed_tensors/compressors/sparse_compressors/sparse_bitmask.py,sha256=S8vW0FI9ep_XtUQOxj0P5utJt3vKEYOHjWEPp-Xd9aY,5820
|
19
19
|
compressed_tensors/compressors/sparse_quantized_compressors/__init__.py,sha256=4f_cwcKXB1nVVMoiKgTFAc8jAPjPLElo-Df_EDm1_xw,675
|
20
20
|
compressed_tensors/compressors/sparse_quantized_compressors/marlin_24.py,sha256=7F9J6wgkecitK5hHuqjetZ18HExHIF4QIw1wgm2Y6U8,10099
|
@@ -61,8 +61,8 @@ compressed_tensors/utils/permutations_24.py,sha256=kx6fsfDHebx94zsSzhXGyCyuC9sVy
|
|
61
61
|
compressed_tensors/utils/permute.py,sha256=V6tJLKo3Syccj-viv4F7ZKZgJeCB-hl-dK8RKI_kBwI,2355
|
62
62
|
compressed_tensors/utils/safetensors_load.py,sha256=DMfZBuUbA6qp_BG_zIWT3ckiEE33K9ob34s-OgzReO4,12057
|
63
63
|
compressed_tensors/utils/semi_structured_conversions.py,sha256=XKNffPum54kPASgqKzgKvyeqWPAkair2XEQXjkp7ho8,13489
|
64
|
-
compressed_tensors-0.10.
|
65
|
-
compressed_tensors-0.10.
|
66
|
-
compressed_tensors-0.10.
|
67
|
-
compressed_tensors-0.10.
|
68
|
-
compressed_tensors-0.10.
|
64
|
+
compressed_tensors-0.10.3a20250710.dist-info/licenses/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
|
65
|
+
compressed_tensors-0.10.3a20250710.dist-info/METADATA,sha256=TodSeLplEMKQAyDzDHZDT7DPvFFEK5-qUokJdpw2yCg,7031
|
66
|
+
compressed_tensors-0.10.3a20250710.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
67
|
+
compressed_tensors-0.10.3a20250710.dist-info/top_level.txt,sha256=w2i-GyPs2s1UwVxvutSvN_lM22SXC2hQFBmoMcPnV7Y,19
|
68
|
+
compressed_tensors-0.10.3a20250710.dist-info/RECORD,,
|
{compressed_tensors-0.10.3a20250709.dist-info → compressed_tensors-0.10.3a20250710.dist-info}/WHEEL
RENAMED
File without changes
|
File without changes
|
File without changes
|