PyPI - compressed-tensors - Versions diffs - 0.9.3__py3-none-any.whl → 0.9.4a20250410__py3-none-any.whl - Mend

compressed-tensors 0.9.3__py3-none-any.whl → 0.9.4a20250410__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (9) hide show

compressed_tensors/quantization/quant_config.py CHANGED Viewed

@@ -230,10 +230,6 @@ class QuantizationConfig(BaseModel):
             group_name = "group_" + str(idx)
             config_groups[group_name] = scheme
-        # TODO: this is incorrect in compressed mode, since we are overwriting the
-        # original weight we lose the uncompressed bit_depth indo
-        compression_ratio = calculate_compression_ratio(model)
         if format is None:
             if quantization_status == QuantizationStatus.COMPRESSED:
                 format = CompressionFormat.int_quantized.value
@@ -244,7 +240,7 @@ class QuantizationConfig(BaseModel):
             config_groups=config_groups,
             quantization_status=quantization_status,
             kv_cache_scheme=kv_cache_scheme,
-            global_compression_ratio=compression_ratio,
+            global_compression_ratio=None,
             format=format,
             ignore=consolidated_ignore,
         )

compressed_tensors/quantization/quant_scheme.py CHANGED Viewed

@@ -142,6 +142,18 @@ W4A16 = dict(
     ),
 )
+# 4 bit integer weights only asymmetric quantization
+W4A16_ASYM = dict(
+    weights=QuantizationArgs(
+        num_bits=4,
+        type=QuantizationType.INT,
+        strategy=QuantizationStrategy.GROUP,
+        group_size=128,
+        symmetric=False,
+        dynamic=False,
+    ),
+)
 # 4 bit integer weights and 8 bit activations quantization
 INT8_W4A8 = dict(
     weights=QuantizationArgs(
@@ -205,6 +217,7 @@ PRESET_SCHEMES = {
     # Integer weight only schemes
     "W8A16": W8A16,
     "W4A16": W4A16,
+    "W4A16_ASYM": W4A16_ASYM,
     # Integer weight and activation schemes
     "W8A8": INT8_W8A8,
     "INT8": INT8_W8A8,  # alias for W8A8

compressed_tensors/quantization/utils/helpers.py CHANGED Viewed

@@ -64,8 +64,11 @@ def calculate_qparams(
     :param quantization_args: settings to quantization
     :return: tuple of the calculated scale(s) and zero point(s)
     """
+    # based on the implementations for consuming quantized values,
+    # 0.0 must always be representable within the quantized range
     min_vals = torch.min(min_vals, torch.zeros_like(min_vals))
     max_vals = torch.max(max_vals, torch.zeros_like(max_vals))
     device = min_vals.device
     bit_min, bit_max = calculate_range(quantization_args, device)
@@ -84,6 +87,9 @@ def calculate_qparams(
         zero_points = torch.clamp(zero_points, bit_min, bit_max)
     # match zero-points to quantized type
+    # if casting to int, use round instead of truncate
+    if quantization_args.type == QuantizationType.INT:
+        zero_points = torch.round(zero_points)
     zero_points = zero_points.to(zp_dtype)
     if scales.ndim == 0:
@@ -96,7 +102,7 @@ def calculate_qparams(
 def compute_dynamic_scales_and_zp(value: Tensor, args: QuantizationArgs):
     """
     Returns the computed scales and zero points for dynamic activation
-    qunatization.
+    quantization.
     :param value: tensor to calculate quantization parameters for
     :param args: quantization args

compressed_tensors/version.py CHANGED Viewed

@@ -1,53 +1,21 @@
-# Copyright (c) 2021 - present / Neuralmagic, Inc. All Rights Reserved.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#    http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing,
-# software distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
+# file generated by setuptools-scm
+# don't change, don't track in version control
-"""
-Functionality for storing and setting the version info for SparseML
-"""
+__all__ = ["__version__", "__version_tuple__", "version", "version_tuple"]
+TYPE_CHECKING = False
+if TYPE_CHECKING:
+    from typing import Tuple
+    from typing import Union
-version_base = "0.9.3"
-is_release = True  # change to True to set the generated version as a release version
+    VERSION_TUPLE = Tuple[Union[int, str], ...]
+else:
+    VERSION_TUPLE = object
+version: str
+__version__: str
+__version_tuple__: VERSION_TUPLE
+version_tuple: VERSION_TUPLE
-def _generate_version(
-    is_release: bool,
-    version_base: str,
-):
-    from datetime import date
-    if is_release:
-        return version_base
-    else:
-        return f"{version_base}.{date.today().strftime('%Y%m%d')}"
-__all__ = [
-    "__version__",
-    "version_base",
-    "is_release",
-    "version",
-    "version_major",
-    "version_minor",
-    "version_patch",
-    "version_build",
-    "version_major_minor",
-]
-__version__ = _generate_version(is_release, version_base)
-version = __version__
-version_major, version_minor, version_patch, version_build = version.split(".") + (
-    [None] if len(version.split(".")) < 4 else []
-)  # handle conditional for version being 3 parts or 4 (4 containing build date)
-version_major_minor = f"{version_major}.{version_minor}"
+__version__ = version = '0.9.4a20250410'
+__version_tuple__ = version_tuple = (0, 9, 4)

{compressed_tensors-0.9.3.dist-info → compressed_tensors-0.9.4a20250410.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: compressed-tensors
-Version: 0.9.3
+Version: 0.9.4a20250410
 Summary: Library for utilization of compressed safetensors of neural network models
 Home-page: https://github.com/neuralmagic/compressed-tensors
 Author: Neuralmagic, Inc.
@@ -64,7 +64,7 @@ pip install compressed-tensors
 Nightly release:
 ```bash
-pip install compressed-tensors-nightly
+pip install --pre compressed-tensors
 ```
 ### From Source

{compressed_tensors-0.9.3.dist-info → compressed_tensors-0.9.4a20250410.dist-info}/RECORD RENAMED Viewed

@@ -1,6 +1,6 @@
 compressed_tensors/__init__.py,sha256=UtKmifNeBCSE2TZSAfduVNNzHY-3V7bLjZ7n7RuXLOE,812
 compressed_tensors/base.py,sha256=73HYH7HY7O2roC89yG_piPFnZwrBfn_i7HmKl90SKc0,875
-compressed_tensors/version.py,sha256=X4y5lqlF1QFUgl25iumzagpg3dzyVoLP6i82HZEhCJA,1585
+compressed_tensors/version.py,sha256=ttCtltINyBJn0un6r4KDJzCF49mLYcu-E_khCO2nku8,520
 compressed_tensors/compressors/__init__.py,sha256=smSygTSfcfuujRrAXDc6uZm4L_ccV1tWZewqVnOb4lM,825
 compressed_tensors/compressors/base.py,sha256=x8dQrWVEurynXw03yHJZTaAmrRTOsdZJoHjmvs0IKwk,7002
 compressed_tensors/compressors/helpers.py,sha256=OK6qxX9j3bHwF9JfIYSGMgBJe2PWjlTA3byXKCJaTIQ,5431
@@ -26,8 +26,8 @@ compressed_tensors/linear/__init__.py,sha256=fH6rjBYAxuwrTzBTlTjTgCYNyh6TCvCqajC
 compressed_tensors/linear/compressed_linear.py,sha256=_m6XpNcI53eeSHO8VdiuAM6UBTdpDhn5Ivd8iRMwEKc,3980
 compressed_tensors/quantization/__init__.py,sha256=83J5bPB7PavN2TfCoW7_vEDhfYpm4TDrqYO9vdSQ5bk,760
 compressed_tensors/quantization/quant_args.py,sha256=sKpb8DcNObidjXjNol1Tn_Iih3ZXBycSp-fyz68TGhY,9117
-compressed_tensors/quantization/quant_config.py,sha256=vx06wBo91p4LCb3Vzd-2eCTUeIf_Sz2ZXRP263eQyjQ,10385
-compressed_tensors/quantization/quant_scheme.py,sha256=eQ0JrRZ80GX69fpwW87VzPzzhajhk4mUaJScjk82OY4,6010
+compressed_tensors/quantization/quant_config.py,sha256=MxSUcb5dOqMN6LFyD5K2h8X0TvEtcWIAoiUJqD2dHGE,10159
+compressed_tensors/quantization/quant_scheme.py,sha256=yz0oMbbwp7QZXXd2k5KIJu-Q6aTqg2929VdUzZ7vysM,6324
 compressed_tensors/quantization/lifecycle/__init__.py,sha256=_uItzFWusyV74Zco_pHLOTdE9a83cL-R-ZdyQrBkIyw,772
 compressed_tensors/quantization/lifecycle/apply.py,sha256=lZmCCSm1_o79iUAy460w6Bv9FaOvntVisMdS-dN9fnk,16594
 compressed_tensors/quantization/lifecycle/compressed.py,sha256=Fj9n66IN0EWsOAkBHg3O0GlOQpxstqjCcs0ttzMXrJ0,2296
@@ -35,7 +35,7 @@ compressed_tensors/quantization/lifecycle/forward.py,sha256=DOWouUqfaLA4Qhg-ojVV
 compressed_tensors/quantization/lifecycle/helpers.py,sha256=C0mhy2vJ0fCjVeN4kFNhw8Eq1wkteBGHiZ36RVLThRY,944
 compressed_tensors/quantization/lifecycle/initialize.py,sha256=sK3PLm69N91QepBuq-83Qd2Br6XcOmRDpD5qo_WWNJo,7469
 compressed_tensors/quantization/utils/__init__.py,sha256=VdtEmP0bvuND_IGQnyqUPc5lnFp-1_yD7StKSX4x80w,656
-compressed_tensors/quantization/utils/helpers.py,sha256=DBP-sGRpGAY01K0LFE7qqonNj4hkTYL_mXrMs2LtAD8,14100
+compressed_tensors/quantization/utils/helpers.py,sha256=-wX0H7zVysJ67jRRCGbx6BfxbMU_1sqffTf5YUIpPiU,14391
 compressed_tensors/registry/__init__.py,sha256=FwLSNYqfIrb5JD_6OK_MT4_svvKTN_nEhpgQlQvGbjI,658
 compressed_tensors/registry/registry.py,sha256=vRcjVB1ITfSbfYUaGndBBmqhip_5vsS62weorVg0iXo,11896
 compressed_tensors/utils/__init__.py,sha256=gS4gSU2pwcAbsKj-6YMaqhm25udFy6ISYaWBf-myRSM,808
@@ -45,8 +45,8 @@ compressed_tensors/utils/permutations_24.py,sha256=kx6fsfDHebx94zsSzhXGyCyuC9sVy
 compressed_tensors/utils/permute.py,sha256=V6tJLKo3Syccj-viv4F7ZKZgJeCB-hl-dK8RKI_kBwI,2355
 compressed_tensors/utils/safetensors_load.py,sha256=5SeM2hzLh77Ne8Vk7qR6-km7cf8bhov41ExpWITqX3A,11470
 compressed_tensors/utils/semi_structured_conversions.py,sha256=XKNffPum54kPASgqKzgKvyeqWPAkair2XEQXjkp7ho8,13489
-compressed_tensors-0.9.3.dist-info/licenses/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
-compressed_tensors-0.9.3.dist-info/METADATA,sha256=zs3aFaG-BGV9hqJbW9Zwzex0TVcM5sPZhiaeVx2qjR0,6997
-compressed_tensors-0.9.3.dist-info/WHEEL,sha256=CmyFI0kx5cdEMTLiONQRbGQwjIoR1aIYB7eCAQ4KPJ0,91
-compressed_tensors-0.9.3.dist-info/top_level.txt,sha256=w2i-GyPs2s1UwVxvutSvN_lM22SXC2hQFBmoMcPnV7Y,19
-compressed_tensors-0.9.3.dist-info/RECORD,,
+compressed_tensors-0.9.4a20250410.dist-info/licenses/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
+compressed_tensors-0.9.4a20250410.dist-info/METADATA,sha256=EKD2EHV9dh7GHjeO25QvapLLR3JabT4WC04IU6K-cLg,7004
+compressed_tensors-0.9.4a20250410.dist-info/WHEEL,sha256=CmyFI0kx5cdEMTLiONQRbGQwjIoR1aIYB7eCAQ4KPJ0,91
+compressed_tensors-0.9.4a20250410.dist-info/top_level.txt,sha256=w2i-GyPs2s1UwVxvutSvN_lM22SXC2hQFBmoMcPnV7Y,19
+compressed_tensors-0.9.4a20250410.dist-info/RECORD,,

{compressed_tensors-0.9.3.dist-info → compressed_tensors-0.9.4a20250410.dist-info}/WHEEL RENAMED Viewed

File without changes

{compressed_tensors-0.9.3.dist-info → compressed_tensors-0.9.4a20250410.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

{compressed_tensors-0.9.3.dist-info → compressed_tensors-0.9.4a20250410.dist-info}/top_level.txt RENAMED Viewed

File without changes

compressed-tensors 0.9.3__py3-none-any.whl → 0.9.4a20250410__py3-none-any.whl

compressed-tensors 0.9.3__py3-none-any.whl → 0.9.4a20250410__py3-none-any.whl