compressed-tensors-nightly 0.6.0.20240920__tar.gz → 0.6.0.20240921__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (58)
  1. {compressed-tensors-nightly-0.6.0.20240920/src/compressed_tensors_nightly.egg-info → compressed-tensors-nightly-0.6.0.20240921}/PKG-INFO +1 -1
  2. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/config/base.py +6 -1
  3. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/quantization/quant_scheme.py +4 -9
  4. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921/src/compressed_tensors_nightly.egg-info}/PKG-INFO +1 -1
  5. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/LICENSE +0 -0
  6. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/README.md +0 -0
  7. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/pyproject.toml +0 -0
  8. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/setup.cfg +0 -0
  9. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/setup.py +0 -0
  10. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/__init__.py +0 -0
  11. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/base.py +0 -0
  12. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/compressors/__init__.py +0 -0
  13. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/compressors/base.py +0 -0
  14. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/compressors/dense.py +0 -0
  15. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/compressors/helpers.py +0 -0
  16. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/compressors/marlin_24.py +0 -0
  17. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/compressors/model_compressor.py +0 -0
  18. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/compressors/naive_quantized.py +0 -0
  19. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/compressors/pack_quantized.py +0 -0
  20. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/compressors/sparse_bitmask.py +0 -0
  21. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/config/__init__.py +0 -0
  22. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/config/dense.py +0 -0
  23. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/config/sparse_bitmask.py +0 -0
  24. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/linear/__init__.py +0 -0
  25. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/linear/compressed_linear.py +0 -0
  26. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/quantization/__init__.py +0 -0
  27. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/quantization/lifecycle/__init__.py +0 -0
  28. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/quantization/lifecycle/apply.py +0 -0
  29. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/quantization/lifecycle/calibration.py +0 -0
  30. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/quantization/lifecycle/compressed.py +0 -0
  31. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/quantization/lifecycle/forward.py +0 -0
  32. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/quantization/lifecycle/frozen.py +0 -0
  33. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/quantization/lifecycle/helpers.py +0 -0
  34. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/quantization/lifecycle/initialize.py +0 -0
  35. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/quantization/observers/__init__.py +0 -0
  36. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/quantization/observers/base.py +0 -0
  37. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/quantization/observers/helpers.py +0 -0
  38. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/quantization/observers/memoryless.py +0 -0
  39. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/quantization/observers/min_max.py +0 -0
  40. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/quantization/observers/mse.py +0 -0
  41. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/quantization/quant_args.py +0 -0
  42. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/quantization/quant_config.py +0 -0
  43. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/quantization/utils/__init__.py +0 -0
  44. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/quantization/utils/helpers.py +0 -0
  45. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/registry/__init__.py +0 -0
  46. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/registry/registry.py +0 -0
  47. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/utils/__init__.py +0 -0
  48. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/utils/helpers.py +0 -0
  49. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/utils/offload.py +0 -0
  50. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/utils/permutations_24.py +0 -0
  51. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/utils/permute.py +0 -0
  52. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/utils/safetensors_load.py +0 -0
  53. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/utils/semi_structured_conversions.py +0 -0
  54. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors/version.py +0 -0
  55. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors_nightly.egg-info/SOURCES.txt +0 -0
  56. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors_nightly.egg-info/dependency_links.txt +0 -0
  57. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors_nightly.egg-info/requires.txt +0 -0
  58. {compressed-tensors-nightly-0.6.0.20240920 → compressed-tensors-nightly-0.6.0.20240921}/src/compressed_tensors_nightly.egg-info/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: compressed-tensors-nightly
3
- Version: 0.6.0.20240920
3
+ Version: 0.6.0.20240921
4
4
  Summary: Library for utilization of compressed safetensors of neural network models
5
5
  Home-page: https://github.com/neuralmagic/compressed-tensors
6
6
  Author: Neuralmagic, Inc.
@@ -13,7 +13,7 @@
13
13
  # limitations under the License.
14
14
 
15
15
  from enum import Enum
16
- from typing import Optional
16
+ from typing import List, Optional
17
17
 
18
18
  from compressed_tensors.registry import RegistryMixin
19
19
  from pydantic import BaseModel
@@ -37,11 +37,16 @@ class SparsityCompressionConfig(RegistryMixin, BaseModel):
37
37
  Base data class for storing sparsity compression parameters
38
38
 
39
39
  :param format: name of compression format
40
+ :param targets: List of layer names or layer types to target for sparsity
41
+ compression. By default, assume all layers are targeted
42
+ :param ignore: List of layer names (unique) to ignore from targets. Defaults to None
40
43
  :param global_sparsity: average sparsity of the entire model
41
44
  :param sparsity_structure: structure of the sparsity, such as
42
45
  "unstructured", "2:4", "8:16" etc
43
46
  """
44
47
 
45
48
  format: str
49
+ targets: Optional[List[str]] = None
50
+ ignore: Optional[List[str]] = None
46
51
  global_sparsity: Optional[float] = 0.0
47
52
  sparsity_structure: Optional[str] = "unstructured"
@@ -57,15 +57,9 @@ class QuantizationScheme(BaseModel):
57
57
  # default to quantizing all Linear layers
58
58
  targets = ["Linear"]
59
59
 
60
- # default to 8 bit integer symmetric quantization
61
- # for weights
62
- weights = QuantizationArgs(num_bits=8, symmetric=True)
63
-
64
- # default to 8 bit integer asymmetric quantization
65
- input_activations = QuantizationArgs(num_bits=8, symmetric=True)
66
-
67
- # Do not quantize the output activations
68
- # by default
60
+ # by default, activations and weights are left unquantized
61
+ weights = None
62
+ input_activations = None
69
63
  output_activations = None
70
64
 
71
65
  return cls(
@@ -110,6 +104,7 @@ def is_preset_scheme(name: str) -> bool:
110
104
  """
111
105
  return name.upper() in PRESET_SCHEMES
112
106
 
107
+
113
108
  UNQUANTIZED = dict()
114
109
 
115
110
  # 8 bit integer weights and 8 bit activations quantization
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: compressed-tensors-nightly
3
- Version: 0.6.0.20240920
3
+ Version: 0.6.0.20240921
4
4
  Summary: Library for utilization of compressed safetensors of neural network models
5
5
  Home-page: https://github.com/neuralmagic/compressed-tensors
6
6
  Author: Neuralmagic, Inc.