mmgp 3.6.4__py3-none-any.whl → 3.6.6__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of mmgp might be problematic. Click here for more details.
- mmgp/offload.py +14 -5
- {mmgp-3.6.4.dist-info → mmgp-3.6.6.dist-info}/METADATA +1 -1
- mmgp-3.6.6.dist-info/RECORD +10 -0
- {mmgp-3.6.4.dist-info → mmgp-3.6.6.dist-info}/licenses/LICENSE.md +1 -1
- mmgp-3.6.4.dist-info/RECORD +0 -10
- {mmgp-3.6.4.dist-info → mmgp-3.6.6.dist-info}/WHEEL +0 -0
- {mmgp-3.6.4.dist-info → mmgp-3.6.6.dist-info}/top_level.txt +0 -0
mmgp/offload.py
CHANGED
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# ------------------ Memory Management 3.6.4 for the GPU Poor by DeepBeepMeep (mmgp)------------------
|
|
1
|
+
# ------------------ Memory Management 3.6.6 for the GPU Poor by DeepBeepMeep (mmgp)------------------
|
|
2
2
|
#
|
|
3
3
|
# This module contains multiples optimisations so that models such as Flux (and derived), Mochi, CogView, HunyuanVideo, ... can run smoothly on a 24 GB GPU limited card.
|
|
4
4
|
# This a replacement for the accelerate library that should in theory manage offloading, but doesn't work properly with models that are loaded / unloaded several
|
|
@@ -63,7 +63,7 @@ import json
|
|
|
63
63
|
import psutil
|
|
64
64
|
import builtins
|
|
65
65
|
from accelerate import init_empty_weights
|
|
66
|
-
|
|
66
|
+
from functools import wraps
|
|
67
67
|
import functools
|
|
68
68
|
import types
|
|
69
69
|
|
|
@@ -86,6 +86,14 @@ class QEmbedding(QModuleMixin, torch.nn.Embedding):
|
|
|
86
86
|
|
|
87
87
|
|
|
88
88
|
|
|
89
|
+
def cudacontext(device):
|
|
90
|
+
def decorator(func):
|
|
91
|
+
@wraps(func)
|
|
92
|
+
def wrapper(*args, **kwargs):
|
|
93
|
+
with torch.device(device):
|
|
94
|
+
return func(*args, **kwargs)
|
|
95
|
+
return wrapper
|
|
96
|
+
return decorator
|
|
89
97
|
|
|
90
98
|
|
|
91
99
|
shared_state = {}
|
|
@@ -689,7 +697,7 @@ def _welcome():
|
|
|
689
697
|
if welcome_displayed:
|
|
690
698
|
return
|
|
691
699
|
welcome_displayed = True
|
|
692
|
-
print(f"{BOLD}{HEADER}************ Memory Management for the GPU Poor (mmgp 3.6.4) by DeepBeepMeep ************{ENDC}{UNBOLD}")
|
|
700
|
+
print(f"{BOLD}{HEADER}************ Memory Management for the GPU Poor (mmgp 3.6.6) by DeepBeepMeep ************{ENDC}{UNBOLD}")
|
|
693
701
|
|
|
694
702
|
def change_dtype(model, new_dtype, exclude_buffers = False):
|
|
695
703
|
for submodule_name, submodule in model.named_modules():
|
|
@@ -1294,6 +1302,7 @@ def sync_models_loras(model, model2):
|
|
|
1294
1302
|
|
|
1295
1303
|
def unload_loras_from_model(model):
|
|
1296
1304
|
if model is None: return
|
|
1305
|
+
if not hasattr(model, "_loras_model_data"): return
|
|
1297
1306
|
for _, v in model._loras_model_data.items():
|
|
1298
1307
|
v.clear()
|
|
1299
1308
|
for _, v in model._loras_model_shortcuts.items():
|
|
@@ -1420,7 +1429,6 @@ def fast_load_transformers_model(model_path: str, do_quantize = False, quantiza
|
|
|
1420
1429
|
model = transfomer_class.from_config(transformer_config )
|
|
1421
1430
|
|
|
1422
1431
|
|
|
1423
|
-
torch.set_default_device('cpu')
|
|
1424
1432
|
model.eval().requires_grad_(False)
|
|
1425
1433
|
|
|
1426
1434
|
model._config = transformer_config
|
|
@@ -1431,6 +1439,7 @@ def fast_load_transformers_model(model_path: str, do_quantize = False, quantiza
|
|
|
1431
1439
|
|
|
1432
1440
|
|
|
1433
1441
|
|
|
1442
|
+
@cudacontext("cpu")
|
|
1434
1443
|
def load_model_data(model, file_path, do_quantize = False, quantizationType = qint8, pinToMemory = False, partialPinning = False, modelPrefix = None, writable_tensors = True, preprocess_sd = None, postprocess_sd = None, modules = None, return_shared_modules = None, default_dtype = torch.bfloat16, ignore_unused_weights = False, verboseLevel = -1):
|
|
1435
1444
|
"""
|
|
1436
1445
|
Load a model, detect if it has been previously quantized using quanto and do the extra setup if necessary
|
|
@@ -1486,6 +1495,7 @@ def load_model_data(model, file_path, do_quantize = False, quantizationType = qi
|
|
|
1486
1495
|
for no, file in enumerate(file_path):
|
|
1487
1496
|
quantization_map = None
|
|
1488
1497
|
tied_weights_map = None
|
|
1498
|
+
metadata = None
|
|
1489
1499
|
if not (".safetensors" in file or ".sft" in file):
|
|
1490
1500
|
if pinToMemory:
|
|
1491
1501
|
raise Exception("Pinning to memory while loading only supported for safe tensors files")
|
|
@@ -1497,7 +1507,6 @@ def load_model_data(model, file_path, do_quantize = False, quantizationType = qi
|
|
|
1497
1507
|
basename = os.path.basename(file)
|
|
1498
1508
|
|
|
1499
1509
|
if "-of-" in basename:
|
|
1500
|
-
metadata = None
|
|
1501
1510
|
file_parts= basename.split("-")
|
|
1502
1511
|
parts_max = int(file_parts[-1][:5])
|
|
1503
1512
|
state_dict = {}
|
|
@@ -0,0 +1,10 @@
|
|
|
1
|
+
__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
2
|
+
mmgp/__init__.py,sha256=A9qBwyQMd1M7vshSTOBnFGP1MQvS2hXmTcTCMUcmyzE,509
|
|
3
|
+
mmgp/fp8_quanto_bridge.py,sha256=VtUaD6wzo7Yn9vGY0LMtbhwt6KMWRpSWLc65bU_sfZU,21155
|
|
4
|
+
mmgp/offload.py,sha256=Zd14BTWZ-Y_rcBzrKITimNQlMezIdzTkbhxbd-ggsrY,139244
|
|
5
|
+
mmgp/safetensors2.py,sha256=zYNMprt1KoxgVALbcz6DawxsQDNNRImvgO9cYRChUiY,19028
|
|
6
|
+
mmgp-3.6.6.dist-info/licenses/LICENSE.md,sha256=DD-WIS0BkPoWJ_8hQO3J8hMP9K_1-dyrYv1YCbkxcDU,94
|
|
7
|
+
mmgp-3.6.6.dist-info/METADATA,sha256=B4y6VLFaEDAi3E59WV7fNNEFwS4HP9zT0UILUq7GOn0,16309
|
|
8
|
+
mmgp-3.6.6.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
9
|
+
mmgp-3.6.6.dist-info/top_level.txt,sha256=waGaepj2qVfnS2yAOkaMu4r9mJaVjGbEi6AwOUogU_U,14
|
|
10
|
+
mmgp-3.6.6.dist-info/RECORD,,
|
|
@@ -1,2 +1,2 @@
|
|
|
1
|
-
GNU GENERAL PUBLIC LICENSE
|
|
1
|
+
GNU GENERAL PUBLIC LICENSE
|
|
2
2
|
Version 3, 29 June 2007
|
mmgp-3.6.4.dist-info/RECORD
DELETED
|
@@ -1,10 +0,0 @@
|
|
|
1
|
-
__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
2
|
-
mmgp/__init__.py,sha256=A9qBwyQMd1M7vshSTOBnFGP1MQvS2hXmTcTCMUcmyzE,509
|
|
3
|
-
mmgp/fp8_quanto_bridge.py,sha256=VtUaD6wzo7Yn9vGY0LMtbhwt6KMWRpSWLc65bU_sfZU,21155
|
|
4
|
-
mmgp/offload.py,sha256=hRSLKfUY_7bMRS2BUv79cB4BGjub5uLhVpZuoc9AWTI,138940
|
|
5
|
-
mmgp/safetensors2.py,sha256=zYNMprt1KoxgVALbcz6DawxsQDNNRImvgO9cYRChUiY,19028
|
|
6
|
-
mmgp-3.6.4.dist-info/licenses/LICENSE.md,sha256=HjzvY2grdtdduZclbZ46B2M-XpT4MDCxFub5ZwTWq2g,93
|
|
7
|
-
mmgp-3.6.4.dist-info/METADATA,sha256=e2NavzQQfgehOKy1KRyy_I2sL3tIpePcBHMzlvFDOGE,16309
|
|
8
|
-
mmgp-3.6.4.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
9
|
-
mmgp-3.6.4.dist-info/top_level.txt,sha256=waGaepj2qVfnS2yAOkaMu4r9mJaVjGbEi6AwOUogU_U,14
|
|
10
|
-
mmgp-3.6.4.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|