compressed-tensors-nightly 0.6.0.20240923__tar.gz → 0.6.0.20240925__tar.gz

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Files changed (58)
  1. {compressed-tensors-nightly-0.6.0.20240923/src/compressed_tensors_nightly.egg-info → compressed-tensors-nightly-0.6.0.20240925}/PKG-INFO +1 -1
  2. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/__init__.py +1 -0
  3. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/compressors/model_compressor.py +2 -0
  4. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/quantization/quant_scheme.py +5 -4
  5. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925/src/compressed_tensors_nightly.egg-info}/PKG-INFO +1 -1
  6. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/LICENSE +0 -0
  7. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/README.md +0 -0
  8. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/pyproject.toml +0 -0
  9. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/setup.cfg +0 -0
  10. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/setup.py +0 -0
  11. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/base.py +0 -0
  12. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/compressors/__init__.py +0 -0
  13. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/compressors/base.py +0 -0
  14. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/compressors/dense.py +0 -0
  15. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/compressors/helpers.py +0 -0
  16. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/compressors/marlin_24.py +0 -0
  17. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/compressors/naive_quantized.py +0 -0
  18. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/compressors/pack_quantized.py +0 -0
  19. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/compressors/sparse_bitmask.py +0 -0
  20. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/config/__init__.py +0 -0
  21. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/config/base.py +0 -0
  22. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/config/dense.py +0 -0
  23. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/config/sparse_bitmask.py +0 -0
  24. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/linear/__init__.py +0 -0
  25. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/linear/compressed_linear.py +0 -0
  26. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/quantization/__init__.py +0 -0
  27. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/quantization/lifecycle/__init__.py +0 -0
  28. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/quantization/lifecycle/apply.py +0 -0
  29. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/quantization/lifecycle/calibration.py +0 -0
  30. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/quantization/lifecycle/compressed.py +0 -0
  31. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/quantization/lifecycle/forward.py +0 -0
  32. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/quantization/lifecycle/frozen.py +0 -0
  33. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/quantization/lifecycle/helpers.py +0 -0
  34. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/quantization/lifecycle/initialize.py +0 -0
  35. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/quantization/observers/__init__.py +0 -0
  36. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/quantization/observers/base.py +0 -0
  37. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/quantization/observers/helpers.py +0 -0
  38. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/quantization/observers/memoryless.py +0 -0
  39. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/quantization/observers/min_max.py +0 -0
  40. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/quantization/observers/mse.py +0 -0
  41. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/quantization/quant_args.py +0 -0
  42. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/quantization/quant_config.py +0 -0
  43. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/quantization/utils/__init__.py +0 -0
  44. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/quantization/utils/helpers.py +0 -0
  45. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/registry/__init__.py +0 -0
  46. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/registry/registry.py +0 -0
  47. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/utils/__init__.py +0 -0
  48. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/utils/helpers.py +0 -0
  49. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/utils/offload.py +0 -0
  50. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/utils/permutations_24.py +0 -0
  51. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/utils/permute.py +0 -0
  52. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/utils/safetensors_load.py +0 -0
  53. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/utils/semi_structured_conversions.py +0 -0
  54. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors/version.py +0 -0
  55. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors_nightly.egg-info/SOURCES.txt +0 -0
  56. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors_nightly.egg-info/dependency_links.txt +0 -0
  57. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors_nightly.egg-info/requires.txt +0 -0
  58. {compressed-tensors-nightly-0.6.0.20240923 → compressed-tensors-nightly-0.6.0.20240925}/src/compressed_tensors_nightly.egg-info/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: compressed-tensors-nightly
3
- Version: 0.6.0.20240923
3
+ Version: 0.6.0.20240925
4
4
  Summary: Library for utilization of compressed safetensors of neural network models
5
5
  Home-page: https://github.com/neuralmagic/compressed-tensors
6
6
  Author: Neuralmagic, Inc.
@@ -19,3 +19,4 @@ from .compressors import *
19
19
  from .config import *
20
20
  from .quantization import QuantizationConfig, QuantizationStatus
21
21
  from .utils import *
22
+ from .version import *
@@ -22,6 +22,7 @@ from typing import Any, Dict, Optional, Union
22
22
 
23
23
  import torch
24
24
  import transformers
25
+ import compressed_tensors
25
26
  from compressed_tensors.base import (
26
27
  COMPRESSION_CONFIG_NAME,
27
28
  QUANTIZATION_CONFIG_NAME,
@@ -368,6 +369,7 @@ class ModelCompressor:
368
369
  config_data[COMPRESSION_CONFIG_NAME][
369
370
  SPARSITY_CONFIG_NAME
370
371
  ] = sparsity_config_data
372
+ config_data[COMPRESSION_CONFIG_NAME]["version"] = compressed_tensors.__version__
371
373
 
372
374
  with open(config_file_path, "w") as config_file:
373
375
  json.dump(config_data, config_file, indent=2, sort_keys=True)
@@ -108,7 +108,7 @@ def is_preset_scheme(name: str) -> bool:
108
108
  UNQUANTIZED = dict()
109
109
 
110
110
  # 8 bit integer weights and 8 bit activations quantization
111
- W8A8 = dict(
111
+ INT8_W8A8 = dict(
112
112
  weights=QuantizationArgs(
113
113
  num_bits=8,
114
114
  type=QuantizationType.INT,
@@ -149,7 +149,7 @@ W4A16 = dict(
149
149
  )
150
150
 
151
151
  # 4 bit integer weights and 8 bit activations quantization
152
- W4A8 = dict(
152
+ INT8_W4A8 = dict(
153
153
  weights=QuantizationArgs(
154
154
  num_bits=4,
155
155
  type=QuantizationType.INT,
@@ -210,8 +210,9 @@ PRESET_SCHEMES = {
210
210
  "W8A16": W8A16,
211
211
  "W4A16": W4A16,
212
212
  # Integer weight and activation schemes
213
- "W8A8": W8A8,
214
- "W4A8": W4A8,
213
+ "W8A8": INT8_W8A8,
214
+ "INT8": INT8_W8A8, # alias for W8A8
215
+ "W4A8": INT8_W4A8,
215
216
  # Float weight and activation schemes
216
217
  "FP8": FP8,
217
218
  "FP8_DYNAMIC": FP8_DYNAMIC,
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: compressed-tensors-nightly
3
- Version: 0.6.0.20240923
3
+ Version: 0.6.0.20240925
4
4
  Summary: Library for utilization of compressed safetensors of neural network models
5
5
  Home-page: https://github.com/neuralmagic/compressed-tensors
6
6
  Author: Neuralmagic, Inc.