compressed-tensors-nightly 0.9.2.20250227__py3-none-any.whl → 0.9.2.20250301__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -21,6 +21,7 @@ from compressed_tensors.quantization import (
21
21
  QuantizationStatus,
22
22
  initialize_module_for_quantization,
23
23
  )
24
+ from compressed_tensors.utils import register_offload_parameter
24
25
  from torch import Tensor
25
26
  from torch.nn import Parameter
26
27
  from torch.nn.functional import linear
@@ -68,7 +69,7 @@ class CompressedLinear(Linear):
68
69
  param = Parameter(
69
70
  torch.empty(shape, device=device, dtype=dtype), requires_grad=False
70
71
  )
71
- module.register_parameter(name, param)
72
+ register_offload_parameter(module, name, param)
72
73
 
73
74
  # mark module as compressed
74
75
  module.quantization_status = QuantizationStatus.COMPRESSED
@@ -203,11 +203,10 @@ def _initialize_attn_scales(module: Module) -> None:
203
203
  torch.empty(expected_shape, dtype=scale_dtype, device=device),
204
204
  requires_grad=False,
205
205
  )
206
-
207
- module.register_parameter(KVCacheScaleType.KEY.value, init_scale)
206
+ register_offload_parameter(module, KVCacheScaleType.KEY.value, init_scale)
208
207
 
209
208
  init_scale = Parameter(
210
209
  torch.empty(expected_shape, dtype=scale_dtype, device=device),
211
210
  requires_grad=False,
212
211
  )
213
- module.register_parameter(KVCacheScaleType.VALUE.value, init_scale)
212
+ register_offload_parameter(module, KVCacheScaleType.VALUE.value, init_scale)
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.2
2
2
  Name: compressed-tensors-nightly
3
- Version: 0.9.2.20250227
3
+ Version: 0.9.2.20250301
4
4
  Summary: Library for utilization of compressed safetensors of neural network models
5
5
  Home-page: https://github.com/neuralmagic/compressed-tensors
6
6
  Author: Neuralmagic, Inc.
@@ -23,7 +23,7 @@ compressed_tensors/config/dense.py,sha256=NgSxnFCnckU9-iunxEaqiFwqgdO7YYxlWKR74j
23
23
  compressed_tensors/config/sparse_24_bitmask.py,sha256=Lhj39zT2V1hxftprvxvneyhv45ShlXOKd75DBbDTyTE,1401
24
24
  compressed_tensors/config/sparse_bitmask.py,sha256=pZUboRNZTu6NajGOQEFExoPknak5ynVAUeiiYpS1Gt8,1308
25
25
  compressed_tensors/linear/__init__.py,sha256=fH6rjBYAxuwrTzBTlTjTgCYNyh6TCvCqajCz4Im4YrA,617
26
- compressed_tensors/linear/compressed_linear.py,sha256=MJa-UfoKhIkdUWRD1shrXXri2cOwR5GK0a4t4bNYosM,3268
26
+ compressed_tensors/linear/compressed_linear.py,sha256=OjROJloHR5epRQOp-0OBTCUKhbgitmiSFKSRFwJ7nLA,3341
27
27
  compressed_tensors/quantization/__init__.py,sha256=83J5bPB7PavN2TfCoW7_vEDhfYpm4TDrqYO9vdSQ5bk,760
28
28
  compressed_tensors/quantization/quant_args.py,sha256=sKpb8DcNObidjXjNol1Tn_Iih3ZXBycSp-fyz68TGhY,9117
29
29
  compressed_tensors/quantization/quant_config.py,sha256=vx06wBo91p4LCb3Vzd-2eCTUeIf_Sz2ZXRP263eQyjQ,10385
@@ -33,7 +33,7 @@ compressed_tensors/quantization/lifecycle/apply.py,sha256=lZmCCSm1_o79iUAy460w6B
33
33
  compressed_tensors/quantization/lifecycle/compressed.py,sha256=Fj9n66IN0EWsOAkBHg3O0GlOQpxstqjCcs0ttzMXrJ0,2296
34
34
  compressed_tensors/quantization/lifecycle/forward.py,sha256=DOWouUqfaLA4Qhg-ojVVBdhhSAlgZqFC26vZARxE0ko,12961
35
35
  compressed_tensors/quantization/lifecycle/helpers.py,sha256=C0mhy2vJ0fCjVeN4kFNhw8Eq1wkteBGHiZ36RVLThRY,944
36
- compressed_tensors/quantization/lifecycle/initialize.py,sha256=hymYtayTSumm8KCYAYPY267aWmlsJpt8oQFiRblk8qE,7452
36
+ compressed_tensors/quantization/lifecycle/initialize.py,sha256=sK3PLm69N91QepBuq-83Qd2Br6XcOmRDpD5qo_WWNJo,7469
37
37
  compressed_tensors/quantization/utils/__init__.py,sha256=VdtEmP0bvuND_IGQnyqUPc5lnFp-1_yD7StKSX4x80w,656
38
38
  compressed_tensors/quantization/utils/helpers.py,sha256=DBP-sGRpGAY01K0LFE7qqonNj4hkTYL_mXrMs2LtAD8,14100
39
39
  compressed_tensors/registry/__init__.py,sha256=FwLSNYqfIrb5JD_6OK_MT4_svvKTN_nEhpgQlQvGbjI,658
@@ -45,8 +45,8 @@ compressed_tensors/utils/permutations_24.py,sha256=kx6fsfDHebx94zsSzhXGyCyuC9sVy
45
45
  compressed_tensors/utils/permute.py,sha256=V6tJLKo3Syccj-viv4F7ZKZgJeCB-hl-dK8RKI_kBwI,2355
46
46
  compressed_tensors/utils/safetensors_load.py,sha256=5SeM2hzLh77Ne8Vk7qR6-km7cf8bhov41ExpWITqX3A,11470
47
47
  compressed_tensors/utils/semi_structured_conversions.py,sha256=XKNffPum54kPASgqKzgKvyeqWPAkair2XEQXjkp7ho8,13489
48
- compressed_tensors_nightly-0.9.2.20250227.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
49
- compressed_tensors_nightly-0.9.2.20250227.dist-info/METADATA,sha256=YA_gOsRnfooU8JnPC5pBW2ixnmiyLNvuG46KzvAw8qM,6992
50
- compressed_tensors_nightly-0.9.2.20250227.dist-info/WHEEL,sha256=jB7zZ3N9hIM9adW7qlTAyycLYW9npaWKLRzaoVcLKcM,91
51
- compressed_tensors_nightly-0.9.2.20250227.dist-info/top_level.txt,sha256=w2i-GyPs2s1UwVxvutSvN_lM22SXC2hQFBmoMcPnV7Y,19
52
- compressed_tensors_nightly-0.9.2.20250227.dist-info/RECORD,,
48
+ compressed_tensors_nightly-0.9.2.20250301.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
49
+ compressed_tensors_nightly-0.9.2.20250301.dist-info/METADATA,sha256=T0VJWcmuTyaavb6vTZWOzqmtLw9-QBzK3YG_SJTdR-4,6992
50
+ compressed_tensors_nightly-0.9.2.20250301.dist-info/WHEEL,sha256=jB7zZ3N9hIM9adW7qlTAyycLYW9npaWKLRzaoVcLKcM,91
51
+ compressed_tensors_nightly-0.9.2.20250301.dist-info/top_level.txt,sha256=w2i-GyPs2s1UwVxvutSvN_lM22SXC2hQFBmoMcPnV7Y,19
52
+ compressed_tensors_nightly-0.9.2.20250301.dist-info/RECORD,,