compressed-tensors-nightly 0.9.2.20250307__tar.gz → 0.9.2.20250311__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (60) hide show
  1. {compressed_tensors_nightly-0.9.2.20250307/src/compressed_tensors_nightly.egg-info → compressed_tensors_nightly-0.9.2.20250311}/PKG-INFO +1 -1
  2. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/linear/compressed_linear.py +16 -7
  3. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311/src/compressed_tensors_nightly.egg-info}/PKG-INFO +1 -1
  4. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/LICENSE +0 -0
  5. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/README.md +0 -0
  6. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/pyproject.toml +0 -0
  7. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/setup.cfg +0 -0
  8. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/setup.py +0 -0
  9. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/__init__.py +0 -0
  10. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/base.py +0 -0
  11. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/compressors/__init__.py +0 -0
  12. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/compressors/base.py +0 -0
  13. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/compressors/helpers.py +0 -0
  14. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/compressors/model_compressors/__init__.py +0 -0
  15. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/compressors/model_compressors/model_compressor.py +0 -0
  16. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/compressors/quantized_compressors/__init__.py +0 -0
  17. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/compressors/quantized_compressors/base.py +0 -0
  18. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/compressors/quantized_compressors/naive_quantized.py +0 -0
  19. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/compressors/quantized_compressors/pack_quantized.py +0 -0
  20. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/compressors/sparse_compressors/__init__.py +0 -0
  21. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/compressors/sparse_compressors/base.py +0 -0
  22. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/compressors/sparse_compressors/dense.py +0 -0
  23. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/compressors/sparse_compressors/sparse_24_bitmask.py +0 -0
  24. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/compressors/sparse_compressors/sparse_bitmask.py +0 -0
  25. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/compressors/sparse_quantized_compressors/__init__.py +0 -0
  26. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/compressors/sparse_quantized_compressors/marlin_24.py +0 -0
  27. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/config/__init__.py +0 -0
  28. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/config/base.py +0 -0
  29. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/config/dense.py +0 -0
  30. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/config/sparse_24_bitmask.py +0 -0
  31. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/config/sparse_bitmask.py +0 -0
  32. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/linear/__init__.py +0 -0
  33. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/quantization/__init__.py +0 -0
  34. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/quantization/lifecycle/__init__.py +0 -0
  35. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/quantization/lifecycle/apply.py +0 -0
  36. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/quantization/lifecycle/compressed.py +0 -0
  37. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/quantization/lifecycle/forward.py +0 -0
  38. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/quantization/lifecycle/helpers.py +0 -0
  39. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/quantization/lifecycle/initialize.py +0 -0
  40. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/quantization/quant_args.py +0 -0
  41. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/quantization/quant_config.py +0 -0
  42. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/quantization/quant_scheme.py +0 -0
  43. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/quantization/utils/__init__.py +0 -0
  44. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/quantization/utils/helpers.py +0 -0
  45. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/registry/__init__.py +0 -0
  46. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/registry/registry.py +0 -0
  47. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/utils/__init__.py +0 -0
  48. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/utils/helpers.py +0 -0
  49. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/utils/offload.py +0 -0
  50. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/utils/permutations_24.py +0 -0
  51. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/utils/permute.py +0 -0
  52. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/utils/safetensors_load.py +0 -0
  53. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/utils/semi_structured_conversions.py +0 -0
  54. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors/version.py +0 -0
  55. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors_nightly.egg-info/SOURCES.txt +0 -0
  56. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors_nightly.egg-info/dependency_links.txt +0 -0
  57. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors_nightly.egg-info/requires.txt +0 -0
  58. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/src/compressed_tensors_nightly.egg-info/top_level.txt +0 -0
  59. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/tests/test_registry.py +0 -0
  60. {compressed_tensors_nightly-0.9.2.20250307 → compressed_tensors_nightly-0.9.2.20250311}/tests/testing_utils.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.2
2
2
  Name: compressed-tensors-nightly
3
- Version: 0.9.2.20250307
3
+ Version: 0.9.2.20250311
4
4
  Summary: Library for utilization of compressed safetensors of neural network models
5
5
  Home-page: https://github.com/neuralmagic/compressed-tensors
6
6
  Author: Neuralmagic, Inc.
@@ -12,6 +12,7 @@
12
12
  # See the License for the specific language governing permissions and
13
13
  # limitations under the License.
14
14
 
15
+ import warnings
15
16
  from typing import Dict, Tuple
16
17
 
17
18
  import torch
@@ -33,14 +34,15 @@ class CompressedLinear(Linear):
33
34
  Wrapper module for running a compressed forward pass of a quantized Linear module.
34
35
  The wrapped layer will be decompressed on each forward call.
35
36
 
36
- :param module: dense linear module to replace
37
- :param quantization_scheme: quantization config for the module to wrap
38
- :param quantization_format: compression format module is stored as
39
37
  """
40
38
 
41
39
  def __init__(self, *args, **kwargs) -> None:
42
40
  super().__init__(*args, **kwargs)
43
- self._is_compressed = True
41
+ warnings.warn(
42
+ "CompressedLinear should not be initialized directly. "
43
+ "Use the from_linear method instead.",
44
+ UserWarning,
45
+ )
44
46
 
45
47
  @classmethod
46
48
  @torch.no_grad()
@@ -50,6 +52,12 @@ class CompressedLinear(Linear):
50
52
  quantization_scheme: QuantizationScheme,
51
53
  quantization_format: str,
52
54
  ):
55
+ """
56
+ :param module: dense linear module to replace
57
+ :param quantization_scheme: quantization config for the module to wrap
58
+ :param quantization_format: compression format module is stored as
59
+ :return: CompressedLinear module wrapping the input module
60
+ """
53
61
  module.__class__ = CompressedLinear
54
62
  module.compressor = BaseCompressor.load_from_registry(quantization_format)
55
63
  device = next(module.parameters()).device
@@ -90,8 +98,9 @@ class CompressedLinear(Linear):
90
98
  """
91
99
  Decompresses the weight, then runs the wrapped forward pass
92
100
  """
93
- if self._is_compressed:
94
- self.weight = self.compressor.decompress_module(self)
95
- self._is_compressed = False
101
+ if self.quantization_status == QuantizationStatus.COMPRESSED:
102
+ decompressed_weight = self.compressor.decompress_module(self)
103
+ self.weight.data = decompressed_weight
104
+ self.quantization_status = QuantizationStatus.FROZEN
96
105
 
97
106
  return linear(input, self.weight, self.bias)
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.2
2
2
  Name: compressed-tensors-nightly
3
- Version: 0.9.2.20250307
3
+ Version: 0.9.2.20250311
4
4
  Summary: Library for utilization of compressed safetensors of neural network models
5
5
  Home-page: https://github.com/neuralmagic/compressed-tensors
6
6
  Author: Neuralmagic, Inc.