bayesianflow-for-chem 1.2.2__py3-none-any.whl → 1.2.4__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of bayesianflow-for-chem might be problematic.
- bayesianflow_for_chem/__init__.py +1 -1
- bayesianflow_for_chem/model.py +2 -2
- bayesianflow_for_chem/tool.py +120 -55
- {bayesianflow_for_chem-1.2.2.dist-info → bayesianflow_for_chem-1.2.4.dist-info}/METADATA +1 -1
- bayesianflow_for_chem-1.2.4.dist-info/RECORD +12 -0
- bayesianflow_for_chem-1.2.2.dist-info/RECORD +0 -12
- {bayesianflow_for_chem-1.2.2.dist-info → bayesianflow_for_chem-1.2.4.dist-info}/LICENSE +0 -0
- {bayesianflow_for_chem-1.2.2.dist-info → bayesianflow_for_chem-1.2.4.dist-info}/WHEEL +0 -0
- {bayesianflow_for_chem-1.2.2.dist-info → bayesianflow_for_chem-1.2.4.dist-info}/top_level.txt +0 -0
bayesianflow_for_chem/model.py
CHANGED
@@ -847,7 +847,7 @@ class ChemBFN(nn.Module):
         with open(ckpt, "rb") as f:
             state = torch.load(f, "cpu", weights_only=True)
         nn, hparam = state["nn"], state["hparam"]
-        model =
+        model = cls(
             hparam["num_vocab"],
             hparam["channel"],
             hparam["num_layer"],
@@ -926,7 +926,7 @@ class MLP(nn.Module):
         with open(ckpt, "rb") as f:
             state = torch.load(f, "cpu", weights_only=True)
         nn, hparam = state["nn"], state["hparam"]
-        model =
+        model = cls(hparam["size"], hparam["class_input"], hparam["dropout"])
         model.load_state_dict(nn, strict)
         return model
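The functional change in both hunks is that the checkpoint loaders now construct the network with cls(...) instead of naming the class directly, so the classmethod also works when called on a subclass. A minimal, self-contained sketch of that pattern under assumed names (Base, Sub and the "channel" hyperparameter are illustrative, not the package's actual classes):

import torch
import torch.nn as nn


class Base(nn.Module):
    def __init__(self, channel: int) -> None:
        super().__init__()
        self.linear = nn.Linear(channel, channel)

    @classmethod
    def from_checkpoint(cls, ckpt: str) -> "Base":
        # Mirrors the loader shown in the hunk above: state dict plus hyperparameters.
        with open(ckpt, "rb") as f:
            state = torch.load(f, "cpu", weights_only=True)
        nn_state, hparam = state["nn"], state["hparam"]
        # cls(...) rather than Base(...): Sub.from_checkpoint(...) returns a Sub
        # instance instead of an instance of the base class.
        model = cls(hparam["channel"])
        model.load_state_dict(nn_state)
        return model


class Sub(Base):
    pass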
bayesianflow_for_chem/tool.py
CHANGED
@@ -6,17 +6,16 @@ Tools.
 import re
 import csv
 import random
+from copy import deepcopy
 from pathlib import Path
 from typing import List, Dict, Tuple, Union, Optional
 import torch
 import numpy as np
+import torch.nn as nn
 from torch import cuda, Tensor, softmax
+from torch.ao import quantization
 from torch.utils.data import DataLoader
-from
-from torch.ao.quantization.quantizer.xnnpack_quantizer import (
-    XNNPACKQuantizer,
-    get_symmetric_quantization_config,
-)
+from typing_extensions import Self
 from rdkit.Chem import rdDetermineBonds, Bond, MolFromXYZBlock, CanonicalRankAtoms
 from rdkit.Chem.Scaffolds.MurckoScaffold import MurckoScaffoldSmiles  # type: ignore
 from sklearn.metrics import (
@@ -38,7 +37,7 @@ except ImportError:
     _use_pynauty = False

 from .data import VOCAB_KEYS
-from .model import ChemBFN, MLP
+from .model import ChemBFN, MLP, Linear


 _atom_regex_pattern = (
@@ -385,10 +384,7 @@ def sample(
     assert method.split(":")[0].lower() in ("ode", "bfn")
     if device is None:
         device = _find_device()
-    model.to(device)
-    if not isinstance(model, torch.fx.GraphModule):
-        model.eval()  # Calling eval() is not supported for GraphModule
-    # model.to(device).eval()
+    model.to(device).eval()
     if y is not None:
         y = y.to(device)
     if isinstance(allowed_tokens, list):
@@ -463,10 +459,7 @@ def inpaint(
     assert method.split(":")[0].lower() in ("ode", "bfn")
     if device is None:
         device = _find_device()
-    model.to(device)
-    if not isinstance(model, torch.fx.GraphModule):
-        model.eval()  # Calling eval() is not supported for GraphModule
-    # model.to(device).eval()
+    model.to(device).eval()
     x = x.to(device)
     if y is not None:
         y = y.to(device)
@@ -497,52 +490,124 @@
 ]


-def quantise_model(
-    model: ChemBFN, dataloader: DataLoader, mlp: Optional[MLP] = None
-) -> torch.fx.GraphModule:
+def quantise_model(model: ChemBFN) -> nn.Module:
     """
-    [1 removed line, content not shown in this diff view]
+    Dynamic quantisation of the trained model.

     :param model: trained ChemBFN model
-    :param dataloader: DataLoader instance containing example data for calibration
-    :param mlp: trained MLP model (guidance) if applied
     :type model: bayesianflow_for_chem.model.ChemBFN
-    :type dataloader: torch.utils.data.DataLoader
-    :type mlp: bayesianflow_for_chem.model.MLP | None
     :return: quantised model
-    :rtype: torch.
+    :rtype: torch.nn.Module
     """
-    [removed lines 515-530, content not shown in this diff view]
+    from torch.ao.nn.quantized.modules.utils import _quantize_weight
+    from torch.ao.nn.quantized import dynamic
+
+    class QuantisedLinear(dynamic.Linear):
+        # Modified from https://github.com/pytorch/pytorch/blob/main/torch/ao/nn/quantized/dynamic/modules/linear.py
+        # We made it compatible with our LoRA linear layer.
+        # LoRA parameters will not be quantised.
+        def __init__(
+            self,
+            in_features: int,
+            out_features: int,
+            bias_: bool = True,
+            dtype: torch.dtype = torch.qint8,
+        ) -> None:
+            super().__init__(in_features, out_features, bias_, dtype=dtype)
+            self.version = self._version
+            self.lora_enabled: bool = False
+            self.lora_A: Optional[nn.Parameter] = None
+            self.lora_B: Optional[nn.Parameter] = None
+            self.scaling: Optional[float] = None
+            self.lora_dropout: Optional[float] = None
+
+        def enable_lora(
+            self, r: int = 8, lora_alpha: int = 1, lora_dropout: float = 0.0
+        ) -> None:
+            assert r > 0, "Rank should be larger than 0."
+            device = self._weight_bias()[0].device
+            self.lora_A = nn.Parameter(
+                torch.zeros((r, self.in_features), device=device)
+            )
+            self.lora_B = nn.Parameter(
+                torch.zeros((self.out_features, r), device=device)
+            )
+            self.scaling = lora_alpha / r
+            self.lora_dropout = lora_dropout
+            self.lora_enabled = True
+            nn.init.kaiming_uniform_(self.lora_A, a=5**0.5)
+            nn.init.zeros_(self.lora_B)
+            self._packed_params.requires_grad_(False)
+
+        def forward(self, x: Tensor) -> Tensor:
+            # Note that we can handle self.bias == None case.
+            if self._packed_params.dtype == torch.qint8:
+                if self.version is None or self.version < 4:
+                    Y = torch.ops.quantized.linear_dynamic(
+                        x, self._packed_params._packed_params
+                    )
+                else:
+                    Y = torch.ops.quantized.linear_dynamic(
+                        x, self._packed_params._packed_params, reduce_range=True
+                    )
+            elif self._packed_params.dtype == torch.float16:
+                Y = torch.ops.quantized.linear_dynamic_fp16(
+                    x, self._packed_params._packed_params
+                )
+            else:
+                raise RuntimeError("Unsupported dtype on dynamic quantized linear!")
+            result = Y.to(x.dtype)
+            if self.lora_enabled and isinstance(self.lora_dropout, float):
+                result += (
+                    nn.functional.dropout(x, self.lora_dropout, self.training)
+                    @ self.lora_A.transpose(0, 1)
+                    @ self.lora_B.transpose(0, 1)
+                ) * self.scaling
+            return result
+
+        @classmethod
+        def from_float(
+            cls, mod: Linear, use_precomputed_fake_quant: bool = False
+        ) -> Self:
+            assert hasattr(
+                mod, "qconfig"
+            ), "Input float module must have qconfig defined"
+            if mod.qconfig is not None and mod.qconfig.weight is not None:
+                weight_observer = mod.qconfig.weight()
             else:
-    [removed lines 532-547, content not shown in this diff view]
+                # We have the circular import issues if we import the qconfig in the beginning of this file:
+                # https://github.com/pytorch/pytorch/pull/24231. The current workaround is to postpone the
+                # import until we need it.
+                from torch.ao.quantization.qconfig import default_dynamic_qconfig
+
+                weight_observer = default_dynamic_qconfig.weight()
+            dtype = weight_observer.dtype
+            assert dtype in [torch.qint8, torch.float16], (
+                "The only supported dtypes for "
+                f"dynamic quantized linear are qint8 and float16 got: {dtype}"
+            )
+            weight_observer(mod.weight)
+            if dtype == torch.qint8:
+                qweight = _quantize_weight(mod.weight.float(), weight_observer)
+            elif dtype == torch.float16:
+                qweight = mod.weight.float()
+            else:
+                raise RuntimeError(
+                    "Unsupported dtype specified for dynamic quantized Linear!"
+                )
+            qlinear = cls(mod.in_features, mod.out_features, dtype=dtype)
+            qlinear.set_weight_bias(qweight, mod.bias)
+            if mod.lora_enabled:
+                qlinear.lora_enabled = True
+                qlinear.lora_A = mod.lora_A
+                qlinear.lora_B = mod.lora_B
+                qlinear.scaling = mod.scaling
+                qlinear.lora_dropout = mod.lora_dropout
+            return qlinear
+
+    mapping = deepcopy(quantization.DEFAULT_DYNAMIC_QUANT_MODULE_MAPPINGS)
+    mapping[Linear] = QuantisedLinear
+    quantised_model = quantization.quantize_dynamic(
+        model, {nn.Linear, Linear}, torch.qint8, mapping
+    )
     return quantised_model
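The rewritten quantise_model drops the earlier calibration-based flow (note the removed dataloader and mlp parameters and the removed XNNPACKQuantizer imports) in favour of eager-mode dynamic quantisation, with LoRA parameters deliberately left in floating point. For orientation, a self-contained sketch of the torch.ao.quantization.quantize_dynamic call pattern the new code relies on, applied to a toy network (the toy module and shapes are illustrative; only the call pattern matches the code above):

import torch
import torch.nn as nn
from torch.ao import quantization

# Toy stand-in for a trained model; not the package's ChemBFN.
toy = nn.Sequential(nn.Linear(16, 32), nn.GELU(), nn.Linear(32, 4))

# Dynamic quantisation: weights are stored as int8 and activations are
# quantised on the fly at inference time; the result is still a plain nn.Module.
quantised = quantization.quantize_dynamic(toy, {nn.Linear}, dtype=torch.qint8)

x = torch.randn(2, 16)
with torch.no_grad():
    out = quantised(x)  # shape (2, 4)

Because the quantised model remains an ordinary nn.Module rather than a torch.fx.GraphModule, the simplified model.to(device).eval() calls in sample() and inpaint() above cover it as well.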
bayesianflow_for_chem-1.2.4.dist-info/RECORD
ADDED
@@ -0,0 +1,12 @@
+bayesianflow_for_chem/__init__.py,sha256=-_0xD4lo_Vn2GrlXG-y13MCTwDfj391kzgTnyLplkNk,293
+bayesianflow_for_chem/data.py,sha256=9tpRba40lxwrB6aPSJMkxUglEVC3VEQC9wWxhDuz3Q8,7760
+bayesianflow_for_chem/model.py,sha256=HvEvW_xRbkv4eSv5lhd72BJMZkg-ZACEi1DAW3p5Q1Y,35918
+bayesianflow_for_chem/scorer.py,sha256=mV1vX8aBGFra2BE7N8WHihVIo3dXmUdPQIGfSaiuNdk,4084
+bayesianflow_for_chem/tool.py,sha256=d-g47Ctn6qb_j1bWCWV99ytUxJ23zJ32SJacQ_WXONk,23028
+bayesianflow_for_chem/train.py,sha256=kj6icGqymUUYopDtpre1oE_wpvpeNilbpzgffBsd1tk,9589
+bayesianflow_for_chem/vocab.txt,sha256=HgtAZmpWYk4y8PqEVC4vqut1vE75DfRKE_10s2UW0rU,790
+bayesianflow_for_chem-1.2.4.dist-info/LICENSE,sha256=hIahDEOTzuHCU5J2nd07LWwkLW7Hko4UFO__ffsvB-8,34523
+bayesianflow_for_chem-1.2.4.dist-info/METADATA,sha256=78FGoGjMsdwBavH4rSDtQ_psRYLSUdcg6cdR7KRmgVQ,5890
+bayesianflow_for_chem-1.2.4.dist-info/WHEEL,sha256=In9FTNxeP60KnTkGw7wk6mJPYd_dQSjEZmXdBdMCI-8,91
+bayesianflow_for_chem-1.2.4.dist-info/top_level.txt,sha256=KHsanI3BMCt8D9Qpze2ycrF6nMa3PyojgO6eS1c8kco,22
+bayesianflow_for_chem-1.2.4.dist-info/RECORD,,
bayesianflow_for_chem-1.2.2.dist-info/RECORD
DELETED
@@ -1,12 +0,0 @@
-bayesianflow_for_chem/__init__.py,sha256=sPILW44_x_imRo2kKPMKWQ45C4aNfRQDo1it5Smqqmo,293
-bayesianflow_for_chem/data.py,sha256=9tpRba40lxwrB6aPSJMkxUglEVC3VEQC9wWxhDuz3Q8,7760
-bayesianflow_for_chem/model.py,sha256=CEwqUMahNEcVOZaFjv1JcBokktjW9LspFsYzKjzNmZk,35922
-bayesianflow_for_chem/scorer.py,sha256=mV1vX8aBGFra2BE7N8WHihVIo3dXmUdPQIGfSaiuNdk,4084
-bayesianflow_for_chem/tool.py,sha256=kjR-BUenSjqkwI-TB0QwYXEMy9qdPjL6y4BZVCVfzHA,20237
-bayesianflow_for_chem/train.py,sha256=kj6icGqymUUYopDtpre1oE_wpvpeNilbpzgffBsd1tk,9589
-bayesianflow_for_chem/vocab.txt,sha256=HgtAZmpWYk4y8PqEVC4vqut1vE75DfRKE_10s2UW0rU,790
-bayesianflow_for_chem-1.2.2.dist-info/LICENSE,sha256=hIahDEOTzuHCU5J2nd07LWwkLW7Hko4UFO__ffsvB-8,34523
-bayesianflow_for_chem-1.2.2.dist-info/METADATA,sha256=vRxX8mUrOJJwg_vkgXmla8s2vKhmZAVIYH_N3htAElQ,5890
-bayesianflow_for_chem-1.2.2.dist-info/WHEEL,sha256=In9FTNxeP60KnTkGw7wk6mJPYd_dQSjEZmXdBdMCI-8,91
-bayesianflow_for_chem-1.2.2.dist-info/top_level.txt,sha256=KHsanI3BMCt8D9Qpze2ycrF6nMa3PyojgO6eS1c8kco,22
-bayesianflow_for_chem-1.2.2.dist-info/RECORD,,
{bayesianflow_for_chem-1.2.2.dist-info → bayesianflow_for_chem-1.2.4.dist-info}/LICENSE
RENAMED
File without changes
{bayesianflow_for_chem-1.2.2.dist-info → bayesianflow_for_chem-1.2.4.dist-info}/WHEEL
RENAMED
File without changes
{bayesianflow_for_chem-1.2.2.dist-info → bayesianflow_for_chem-1.2.4.dist-info}/top_level.txt
RENAMED
File without changes