compressed-tensors-nightly 0.7.1.20241022__py3-none-any.whl → 0.7.1.20241024__py3-none-any.whl
This diff compares the contents of two publicly available versions of the package, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.
- compressed_tensors/quantization/lifecycle/calibration.py +2 -4
- compressed_tensors/quantization/lifecycle/frozen.py +0 -1
- compressed_tensors/quantization/observers/helpers.py +1 -1
- compressed_tensors/quantization/observers/mse.py +3 -1
- {compressed_tensors_nightly-0.7.1.20241022.dist-info → compressed_tensors_nightly-0.7.1.20241024.dist-info}/METADATA +1 -1
- {compressed_tensors_nightly-0.7.1.20241022.dist-info → compressed_tensors_nightly-0.7.1.20241024.dist-info}/RECORD +9 -9
- {compressed_tensors_nightly-0.7.1.20241022.dist-info → compressed_tensors_nightly-0.7.1.20241024.dist-info}/LICENSE +0 -0
- {compressed_tensors_nightly-0.7.1.20241022.dist-info → compressed_tensors_nightly-0.7.1.20241024.dist-info}/WHEEL +0 -0
- {compressed_tensors_nightly-0.7.1.20241022.dist-info → compressed_tensors_nightly-0.7.1.20241024.dist-info}/top_level.txt +0 -0
@@ -64,14 +64,12 @@ def set_module_for_calibration(module: Module, quantize_weights_upfront: bool =
|
|
64
64
|
quantization_args=module.quantization_scheme.weights,
|
65
65
|
)
|
66
66
|
|
67
|
-
observer = module.weight_observer
|
68
|
-
|
69
|
-
g_idx = getattr(module, "weight_g_idx", None)
|
70
|
-
|
71
67
|
offloaded = is_module_offloaded(module)
|
72
68
|
if offloaded:
|
73
69
|
module._hf_hook.pre_forward(module)
|
74
70
|
|
71
|
+
observer = module.weight_observer
|
72
|
+
g_idx = getattr(module, "weight_g_idx", None)
|
75
73
|
scale, zero_point = observer(module.weight, g_idx=g_idx)
|
76
74
|
update_parameter_data(module, scale, "weight_scale")
|
77
75
|
update_parameter_data(module, zero_point, "weight_zero_point")
|
@@ -70,7 +70,9 @@ class MovingAverageMSEObserver(Observer):
|
|
70
70
|
absolute_min_val = torch.amin(observed, dim=reduce_dims, keepdims=True)
|
71
71
|
absolute_max_val = torch.amax(observed, dim=reduce_dims, keepdims=True)
|
72
72
|
|
73
|
-
best = torch.full_like(absolute_min_val, torch.finfo(absolute_min_val.dtype).max)
|
73
|
+
best = torch.full_like(
|
74
|
+
absolute_min_val, torch.finfo(absolute_min_val.dtype).max
|
75
|
+
)
|
74
76
|
min_val = torch.ones_like(absolute_min_val)
|
75
77
|
max_val = torch.zeros_like(absolute_max_val)
|
76
78
|
for i in range(int(self.maxshrink * self.grid)):
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: compressed-tensors-nightly
|
3
|
-
Version: 0.7.1.20241022
|
3
|
+
Version: 0.7.1.20241024
|
4
4
|
Summary: Library for utilization of compressed safetensors of neural network models
|
5
5
|
Home-page: https://github.com/neuralmagic/compressed-tensors
|
6
6
|
Author: Neuralmagic, Inc.
|
@@ -29,17 +29,17 @@ compressed_tensors/quantization/quant_config.py,sha256=NCiMvUMnnz5kTyAkDylxjtEGQ
|
|
29
29
|
compressed_tensors/quantization/quant_scheme.py,sha256=5ggPz5sqEfTUgvJJeiPIINA74QtO-08hb3szsm7UHGE,6000
|
30
30
|
compressed_tensors/quantization/lifecycle/__init__.py,sha256=MXE2E7GfIfRRfhrdGy2Og3AZOz5N59B0ZGFcsD89y6c,821
|
31
31
|
compressed_tensors/quantization/lifecycle/apply.py,sha256=czaayvpeUYyWRJhO_klffw6esptOgA9sBKL5TWQcRdw,15805
|
32
|
-
compressed_tensors/quantization/lifecycle/calibration.py,sha256=
|
32
|
+
compressed_tensors/quantization/lifecycle/calibration.py,sha256=fJ2RDL3E4hmWR8v8nYhq_tv31K8WV00o_4Y3xr7c37Y,3041
|
33
33
|
compressed_tensors/quantization/lifecycle/compressed.py,sha256=Fj9n66IN0EWsOAkBHg3O0GlOQpxstqjCcs0ttzMXrJ0,2296
|
34
34
|
compressed_tensors/quantization/lifecycle/forward.py,sha256=8GjOnx4rwOZZqSDTdnejNOY2DVTjNDzH0DfY_rQam6k,16575
|
35
|
-
compressed_tensors/quantization/lifecycle/frozen.py,sha256=
|
35
|
+
compressed_tensors/quantization/lifecycle/frozen.py,sha256=71TsgS0Uxku0NomdWOBJsVfXCGTne-Gx9zUEMsCmw5Q,1764
|
36
36
|
compressed_tensors/quantization/lifecycle/helpers.py,sha256=C0mhy2vJ0fCjVeN4kFNhw8Eq1wkteBGHiZ36RVLThRY,944
|
37
37
|
compressed_tensors/quantization/lifecycle/initialize.py,sha256=lKoFy18PjbSklyum7f4hoLuWtHShBKax7JDTBzPlCqM,8839
|
38
38
|
compressed_tensors/quantization/observers/__init__.py,sha256=DYrttzq-8MHLZUzpX-xzzm4hrw6HcXkMkux82KBKb1M,738
|
39
39
|
compressed_tensors/quantization/observers/base.py,sha256=5ovQicWPYHjIxr6-EkQ4lgOX0PpI9g23iSzKpxjM1Zg,8420
|
40
|
-
compressed_tensors/quantization/observers/helpers.py,sha256=
|
40
|
+
compressed_tensors/quantization/observers/helpers.py,sha256=nUFdNEIACiPBfFwNYDGCXOvw6tf7j6jfTvDwImHKMPg,5506
|
41
41
|
compressed_tensors/quantization/observers/min_max.py,sha256=sQXqU3z-voxIDfR_9mQzwQUflZj2sASm_G8CYaXntFw,3865
|
42
|
-
compressed_tensors/quantization/observers/mse.py,sha256=
|
42
|
+
compressed_tensors/quantization/observers/mse.py,sha256=G5Y9v4MqXUVcKxBSmCFFW3p_7rlu-6scqLIN88ng-sE,6080
|
43
43
|
compressed_tensors/quantization/utils/__init__.py,sha256=VdtEmP0bvuND_IGQnyqUPc5lnFp-1_yD7StKSX4x80w,656
|
44
44
|
compressed_tensors/quantization/utils/helpers.py,sha256=y4LEyC2oUd876ZMdALWKGH3Ct5EgBJZV4id_NUjTGH8,9531
|
45
45
|
compressed_tensors/registry/__init__.py,sha256=FwLSNYqfIrb5JD_6OK_MT4_svvKTN_nEhpgQlQvGbjI,658
|
@@ -51,8 +51,8 @@ compressed_tensors/utils/permutations_24.py,sha256=kx6fsfDHebx94zsSzhXGyCyuC9sVy
|
|
51
51
|
compressed_tensors/utils/permute.py,sha256=V6tJLKo3Syccj-viv4F7ZKZgJeCB-hl-dK8RKI_kBwI,2355
|
52
52
|
compressed_tensors/utils/safetensors_load.py,sha256=m08ANVuTBxQdoa6LufDgcNJ7wCLDJolyZljB8VEybAU,8578
|
53
53
|
compressed_tensors/utils/semi_structured_conversions.py,sha256=XKNffPum54kPASgqKzgKvyeqWPAkair2XEQXjkp7ho8,13489
|
54
|
-
compressed_tensors_nightly-0.7.1.20241022.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
|
55
|
-
compressed_tensors_nightly-0.7.1.20241022.dist-info/METADATA,sha256=
|
56
|
-
compressed_tensors_nightly-0.7.1.20241022.dist-info/WHEEL,sha256=eOLhNAGa2EW3wWl_TU484h7q1UNgy0JXjjoqKoxAAQc,92
|
57
|
-
compressed_tensors_nightly-0.7.1.20241022.dist-info/top_level.txt,sha256=w2i-GyPs2s1UwVxvutSvN_lM22SXC2hQFBmoMcPnV7Y,19
|
58
|
-
compressed_tensors_nightly-0.7.1.20241022.dist-info/RECORD,,
|
54
|
+
compressed_tensors_nightly-0.7.1.20241024.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
|
55
|
+
compressed_tensors_nightly-0.7.1.20241024.dist-info/METADATA,sha256=-Xf19M04eOlSXjbE9plgrWpGGXCv1B6H_ehjopS6CLs,6799
|
56
|
+
compressed_tensors_nightly-0.7.1.20241024.dist-info/WHEEL,sha256=eOLhNAGa2EW3wWl_TU484h7q1UNgy0JXjjoqKoxAAQc,92
|
57
|
+
compressed_tensors_nightly-0.7.1.20241024.dist-info/top_level.txt,sha256=w2i-GyPs2s1UwVxvutSvN_lM22SXC2hQFBmoMcPnV7Y,19
|
58
|
+
compressed_tensors_nightly-0.7.1.20241024.dist-info/RECORD,,
|
File without changes
|
File without changes
|