compressed-tensors-nightly 0.8.1.20241218__py3-none-any.whl → 0.8.1.20241220__py3-none-any.whl
Sign up to get free protection for your applications and to get access to all the features.
- compressed_tensors/quantization/lifecycle/initialize.py +4 -1
- {compressed_tensors_nightly-0.8.1.20241218.dist-info → compressed_tensors_nightly-0.8.1.20241220.dist-info}/METADATA +1 -1
- {compressed_tensors_nightly-0.8.1.20241218.dist-info → compressed_tensors_nightly-0.8.1.20241220.dist-info}/RECORD +6 -6
- {compressed_tensors_nightly-0.8.1.20241218.dist-info → compressed_tensors_nightly-0.8.1.20241220.dist-info}/LICENSE +0 -0
- {compressed_tensors_nightly-0.8.1.20241218.dist-info → compressed_tensors_nightly-0.8.1.20241220.dist-info}/WHEEL +0 -0
- {compressed_tensors_nightly-0.8.1.20241218.dist-info → compressed_tensors_nightly-0.8.1.20241220.dist-info}/top_level.txt +0 -0
@@ -174,7 +174,10 @@ def _initialize_scale_zero_point(
|
|
174
174
|
device = get_execution_device(module)
|
175
175
|
|
176
176
|
# infer expected scale/zero point shape
|
177
|
-
|
177
|
+
if quantization_args.strategy == QuantizationStrategy.TOKEN:
|
178
|
+
expected_shape = (1, 1)
|
179
|
+
else:
|
180
|
+
expected_shape = 1
|
178
181
|
|
179
182
|
if base_name == "weight" and weight_shape is not None:
|
180
183
|
if quantization_args.strategy == QuantizationStrategy.CHANNEL:
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: compressed-tensors-nightly
|
3
|
-
Version: 0.8.1.20241218
|
3
|
+
Version: 0.8.1.20241220
|
4
4
|
Summary: Library for utilization of compressed safetensors of neural network models
|
5
5
|
Home-page: https://github.com/neuralmagic/compressed-tensors
|
6
6
|
Author: Neuralmagic, Inc.
|
@@ -31,7 +31,7 @@ compressed_tensors/quantization/lifecycle/apply.py,sha256=jCUSgeOBtagE5IhgIbyYMZ
|
|
31
31
|
compressed_tensors/quantization/lifecycle/compressed.py,sha256=Fj9n66IN0EWsOAkBHg3O0GlOQpxstqjCcs0ttzMXrJ0,2296
|
32
32
|
compressed_tensors/quantization/lifecycle/forward.py,sha256=QPL6-vKOFuKdKIEsVqMhsw4x552Jpm2sqO0oeChbnrM,12941
|
33
33
|
compressed_tensors/quantization/lifecycle/helpers.py,sha256=C0mhy2vJ0fCjVeN4kFNhw8Eq1wkteBGHiZ36RVLThRY,944
|
34
|
-
compressed_tensors/quantization/lifecycle/initialize.py,sha256=
|
34
|
+
compressed_tensors/quantization/lifecycle/initialize.py,sha256=WFhbdrKHRZj_kScYCua6HMSbD9rKb8juB6k_EZj7EN4,8634
|
35
35
|
compressed_tensors/quantization/utils/__init__.py,sha256=VdtEmP0bvuND_IGQnyqUPc5lnFp-1_yD7StKSX4x80w,656
|
36
36
|
compressed_tensors/quantization/utils/helpers.py,sha256=DBP-sGRpGAY01K0LFE7qqonNj4hkTYL_mXrMs2LtAD8,14100
|
37
37
|
compressed_tensors/registry/__init__.py,sha256=FwLSNYqfIrb5JD_6OK_MT4_svvKTN_nEhpgQlQvGbjI,658
|
@@ -43,8 +43,8 @@ compressed_tensors/utils/permutations_24.py,sha256=kx6fsfDHebx94zsSzhXGyCyuC9sVy
|
|
43
43
|
compressed_tensors/utils/permute.py,sha256=V6tJLKo3Syccj-viv4F7ZKZgJeCB-hl-dK8RKI_kBwI,2355
|
44
44
|
compressed_tensors/utils/safetensors_load.py,sha256=m08ANVuTBxQdoa6LufDgcNJ7wCLDJolyZljB8VEybAU,8578
|
45
45
|
compressed_tensors/utils/semi_structured_conversions.py,sha256=XKNffPum54kPASgqKzgKvyeqWPAkair2XEQXjkp7ho8,13489
|
46
|
-
compressed_tensors_nightly-0.8.1.20241218.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
|
47
|
-
compressed_tensors_nightly-0.8.1.
|
48
|
-
compressed_tensors_nightly-0.8.1.20241218.dist-info/WHEEL,sha256=tZoeGjtWxWRfdplE7E3d45VPlLNQnvbKiYnx7gwAy8A,92
|
49
|
-
compressed_tensors_nightly-0.8.1.20241218.dist-info/top_level.txt,sha256=w2i-GyPs2s1UwVxvutSvN_lM22SXC2hQFBmoMcPnV7Y,19
|
50
|
-
compressed_tensors_nightly-0.8.1.20241218.dist-info/RECORD,,
|
46
|
+
compressed_tensors_nightly-0.8.1.20241220.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
|
47
|
+
compressed_tensors_nightly-0.8.1.20241220.dist-info/METADATA,sha256=KDGxrqR4lES09Mf7qx-xR7SAdc3Cb5TKmqsePVyjYug,6799
|
48
|
+
compressed_tensors_nightly-0.8.1.20241220.dist-info/WHEEL,sha256=tZoeGjtWxWRfdplE7E3d45VPlLNQnvbKiYnx7gwAy8A,92
|
49
|
+
compressed_tensors_nightly-0.8.1.20241220.dist-info/top_level.txt,sha256=w2i-GyPs2s1UwVxvutSvN_lM22SXC2hQFBmoMcPnV7Y,19
|
50
|
+
compressed_tensors_nightly-0.8.1.20241220.dist-info/RECORD,,
|
File without changes
|
File without changes
|