compressed-tensors-nightly 0.7.1.20241023__tar.gz → 0.7.1.20241024__tar.gz

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.
Files changed (64)
  1. {compressed-tensors-nightly-0.7.1.20241023/src/compressed_tensors_nightly.egg-info → compressed-tensors-nightly-0.7.1.20241024}/PKG-INFO +1 -1
  2. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/quantization/lifecycle/calibration.py +2 -4
  3. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/quantization/lifecycle/frozen.py +0 -1
  4. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/quantization/observers/helpers.py +1 -1
  5. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/quantization/observers/mse.py +3 -1
  6. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024/src/compressed_tensors_nightly.egg-info}/PKG-INFO +1 -1
  7. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/LICENSE +0 -0
  8. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/README.md +0 -0
  9. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/pyproject.toml +0 -0
  10. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/setup.cfg +0 -0
  11. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/setup.py +0 -0
  12. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/__init__.py +0 -0
  13. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/base.py +0 -0
  14. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/compressors/__init__.py +0 -0
  15. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/compressors/base.py +0 -0
  16. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/compressors/helpers.py +0 -0
  17. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/compressors/model_compressors/__init__.py +0 -0
  18. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/compressors/model_compressors/model_compressor.py +0 -0
  19. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/compressors/quantized_compressors/__init__.py +0 -0
  20. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/compressors/quantized_compressors/base.py +0 -0
  21. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/compressors/quantized_compressors/naive_quantized.py +0 -0
  22. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/compressors/quantized_compressors/pack_quantized.py +0 -0
  23. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/compressors/sparse_compressors/__init__.py +0 -0
  24. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/compressors/sparse_compressors/base.py +0 -0
  25. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/compressors/sparse_compressors/dense.py +0 -0
  26. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/compressors/sparse_compressors/sparse_bitmask.py +0 -0
  27. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/compressors/sparse_quantized_compressors/__init__.py +0 -0
  28. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/compressors/sparse_quantized_compressors/marlin_24.py +0 -0
  29. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/config/__init__.py +0 -0
  30. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/config/base.py +0 -0
  31. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/config/dense.py +0 -0
  32. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/config/sparse_bitmask.py +0 -0
  33. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/linear/__init__.py +0 -0
  34. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/linear/compressed_linear.py +0 -0
  35. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/quantization/__init__.py +0 -0
  36. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/quantization/cache.py +0 -0
  37. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/quantization/lifecycle/__init__.py +0 -0
  38. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/quantization/lifecycle/apply.py +0 -0
  39. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/quantization/lifecycle/compressed.py +0 -0
  40. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/quantization/lifecycle/forward.py +0 -0
  41. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/quantization/lifecycle/helpers.py +0 -0
  42. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/quantization/lifecycle/initialize.py +0 -0
  43. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/quantization/observers/__init__.py +0 -0
  44. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/quantization/observers/base.py +0 -0
  45. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/quantization/observers/min_max.py +0 -0
  46. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/quantization/quant_args.py +0 -0
  47. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/quantization/quant_config.py +0 -0
  48. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/quantization/quant_scheme.py +0 -0
  49. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/quantization/utils/__init__.py +0 -0
  50. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/quantization/utils/helpers.py +0 -0
  51. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/registry/__init__.py +0 -0
  52. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/registry/registry.py +0 -0
  53. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/utils/__init__.py +0 -0
  54. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/utils/helpers.py +0 -0
  55. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/utils/offload.py +0 -0
  56. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/utils/permutations_24.py +0 -0
  57. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/utils/permute.py +0 -0
  58. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/utils/safetensors_load.py +0 -0
  59. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/utils/semi_structured_conversions.py +0 -0
  60. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors/version.py +0 -0
  61. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors_nightly.egg-info/SOURCES.txt +0 -0
  62. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors_nightly.egg-info/dependency_links.txt +0 -0
  63. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors_nightly.egg-info/requires.txt +0 -0
  64. {compressed-tensors-nightly-0.7.1.20241023 → compressed-tensors-nightly-0.7.1.20241024}/src/compressed_tensors_nightly.egg-info/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: compressed-tensors-nightly
3
- Version: 0.7.1.20241023
3
+ Version: 0.7.1.20241024
4
4
  Summary: Library for utilization of compressed safetensors of neural network models
5
5
  Home-page: https://github.com/neuralmagic/compressed-tensors
6
6
  Author: Neuralmagic, Inc.
@@ -64,14 +64,12 @@ def set_module_for_calibration(module: Module, quantize_weights_upfront: bool =
64
64
  quantization_args=module.quantization_scheme.weights,
65
65
  )
66
66
 
67
- observer = module.weight_observer
68
-
69
- g_idx = getattr(module, "weight_g_idx", None)
70
-
71
67
  offloaded = is_module_offloaded(module)
72
68
  if offloaded:
73
69
  module._hf_hook.pre_forward(module)
74
70
 
71
+ observer = module.weight_observer
72
+ g_idx = getattr(module, "weight_g_idx", None)
75
73
  scale, zero_point = observer(module.weight, g_idx=g_idx)
76
74
  update_parameter_data(module, scale, "weight_scale")
77
75
  update_parameter_data(module, zero_point, "weight_zero_point")
@@ -14,7 +14,6 @@
14
14
 
15
15
 
16
16
  from compressed_tensors.quantization.quant_config import QuantizationStatus
17
- from compressed_tensors.quantization.utils import is_kv_cache_quant_scheme
18
17
  from torch.nn import Module
19
18
 
20
19
 
@@ -13,7 +13,7 @@
13
13
  # limitations under the License.
14
14
 
15
15
  from collections import Counter
16
- from typing import Optional, Tuple
16
+ from typing import Tuple
17
17
 
18
18
  import torch
19
19
  from compressed_tensors.quantization.quant_args import (
@@ -70,7 +70,9 @@ class MovingAverageMSEObserver(Observer):
70
70
  absolute_min_val = torch.amin(observed, dim=reduce_dims, keepdims=True)
71
71
  absolute_max_val = torch.amax(observed, dim=reduce_dims, keepdims=True)
72
72
 
73
- best = torch.full_like(absolute_min_val, torch.finfo(absolute_min_val.dtype).max)
73
+ best = torch.full_like(
74
+ absolute_min_val, torch.finfo(absolute_min_val.dtype).max
75
+ )
74
76
  min_val = torch.ones_like(absolute_min_val)
75
77
  max_val = torch.zeros_like(absolute_max_val)
76
78
  for i in range(int(self.maxshrink * self.grid)):
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: compressed-tensors-nightly
3
- Version: 0.7.1.20241023
3
+ Version: 0.7.1.20241024
4
4
  Summary: Library for utilization of compressed safetensors of neural network models
5
5
  Home-page: https://github.com/neuralmagic/compressed-tensors
6
6
  Author: Neuralmagic, Inc.