boltz-vsynthes 1.0.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- boltz/__init__.py +7 -0
- boltz/data/__init__.py +0 -0
- boltz/data/const.py +1184 -0
- boltz/data/crop/__init__.py +0 -0
- boltz/data/crop/affinity.py +164 -0
- boltz/data/crop/boltz.py +296 -0
- boltz/data/crop/cropper.py +45 -0
- boltz/data/feature/__init__.py +0 -0
- boltz/data/feature/featurizer.py +1230 -0
- boltz/data/feature/featurizerv2.py +2208 -0
- boltz/data/feature/symmetry.py +602 -0
- boltz/data/filter/__init__.py +0 -0
- boltz/data/filter/dynamic/__init__.py +0 -0
- boltz/data/filter/dynamic/date.py +76 -0
- boltz/data/filter/dynamic/filter.py +24 -0
- boltz/data/filter/dynamic/max_residues.py +37 -0
- boltz/data/filter/dynamic/resolution.py +34 -0
- boltz/data/filter/dynamic/size.py +38 -0
- boltz/data/filter/dynamic/subset.py +42 -0
- boltz/data/filter/static/__init__.py +0 -0
- boltz/data/filter/static/filter.py +26 -0
- boltz/data/filter/static/ligand.py +37 -0
- boltz/data/filter/static/polymer.py +299 -0
- boltz/data/module/__init__.py +0 -0
- boltz/data/module/inference.py +307 -0
- boltz/data/module/inferencev2.py +429 -0
- boltz/data/module/training.py +684 -0
- boltz/data/module/trainingv2.py +660 -0
- boltz/data/mol.py +900 -0
- boltz/data/msa/__init__.py +0 -0
- boltz/data/msa/mmseqs2.py +235 -0
- boltz/data/pad.py +84 -0
- boltz/data/parse/__init__.py +0 -0
- boltz/data/parse/a3m.py +134 -0
- boltz/data/parse/csv.py +100 -0
- boltz/data/parse/fasta.py +138 -0
- boltz/data/parse/mmcif.py +1239 -0
- boltz/data/parse/mmcif_with_constraints.py +1607 -0
- boltz/data/parse/schema.py +1851 -0
- boltz/data/parse/yaml.py +68 -0
- boltz/data/sample/__init__.py +0 -0
- boltz/data/sample/cluster.py +283 -0
- boltz/data/sample/distillation.py +57 -0
- boltz/data/sample/random.py +39 -0
- boltz/data/sample/sampler.py +49 -0
- boltz/data/tokenize/__init__.py +0 -0
- boltz/data/tokenize/boltz.py +195 -0
- boltz/data/tokenize/boltz2.py +396 -0
- boltz/data/tokenize/tokenizer.py +24 -0
- boltz/data/types.py +777 -0
- boltz/data/write/__init__.py +0 -0
- boltz/data/write/mmcif.py +305 -0
- boltz/data/write/pdb.py +171 -0
- boltz/data/write/utils.py +23 -0
- boltz/data/write/writer.py +330 -0
- boltz/main.py +1292 -0
- boltz/model/__init__.py +0 -0
- boltz/model/layers/__init__.py +0 -0
- boltz/model/layers/attention.py +132 -0
- boltz/model/layers/attentionv2.py +111 -0
- boltz/model/layers/confidence_utils.py +231 -0
- boltz/model/layers/dropout.py +34 -0
- boltz/model/layers/initialize.py +100 -0
- boltz/model/layers/outer_product_mean.py +98 -0
- boltz/model/layers/pair_averaging.py +135 -0
- boltz/model/layers/pairformer.py +337 -0
- boltz/model/layers/relative.py +58 -0
- boltz/model/layers/transition.py +78 -0
- boltz/model/layers/triangular_attention/__init__.py +0 -0
- boltz/model/layers/triangular_attention/attention.py +189 -0
- boltz/model/layers/triangular_attention/primitives.py +409 -0
- boltz/model/layers/triangular_attention/utils.py +380 -0
- boltz/model/layers/triangular_mult.py +212 -0
- boltz/model/loss/__init__.py +0 -0
- boltz/model/loss/bfactor.py +49 -0
- boltz/model/loss/confidence.py +590 -0
- boltz/model/loss/confidencev2.py +621 -0
- boltz/model/loss/diffusion.py +171 -0
- boltz/model/loss/diffusionv2.py +134 -0
- boltz/model/loss/distogram.py +48 -0
- boltz/model/loss/distogramv2.py +105 -0
- boltz/model/loss/validation.py +1025 -0
- boltz/model/models/__init__.py +0 -0
- boltz/model/models/boltz1.py +1286 -0
- boltz/model/models/boltz2.py +1249 -0
- boltz/model/modules/__init__.py +0 -0
- boltz/model/modules/affinity.py +223 -0
- boltz/model/modules/confidence.py +481 -0
- boltz/model/modules/confidence_utils.py +181 -0
- boltz/model/modules/confidencev2.py +495 -0
- boltz/model/modules/diffusion.py +844 -0
- boltz/model/modules/diffusion_conditioning.py +116 -0
- boltz/model/modules/diffusionv2.py +677 -0
- boltz/model/modules/encoders.py +639 -0
- boltz/model/modules/encodersv2.py +565 -0
- boltz/model/modules/transformers.py +322 -0
- boltz/model/modules/transformersv2.py +261 -0
- boltz/model/modules/trunk.py +688 -0
- boltz/model/modules/trunkv2.py +828 -0
- boltz/model/modules/utils.py +303 -0
- boltz/model/optim/__init__.py +0 -0
- boltz/model/optim/ema.py +389 -0
- boltz/model/optim/scheduler.py +99 -0
- boltz/model/potentials/__init__.py +0 -0
- boltz/model/potentials/potentials.py +497 -0
- boltz/model/potentials/schedules.py +32 -0
- boltz_vsynthes-1.0.0.dist-info/METADATA +151 -0
- boltz_vsynthes-1.0.0.dist-info/RECORD +112 -0
- boltz_vsynthes-1.0.0.dist-info/WHEEL +5 -0
- boltz_vsynthes-1.0.0.dist-info/entry_points.txt +2 -0
- boltz_vsynthes-1.0.0.dist-info/licenses/LICENSE +21 -0
- boltz_vsynthes-1.0.0.dist-info/top_level.txt +1 -0
boltz/model/modules/affinity.py (new file, @@ -0,0 +1,223 @@):
```python
import torch
from torch import nn

import boltz.model.layers.initialize as init
from boltz.model.layers.pairformer import PairformerNoSeqModule
from boltz.model.modules.encodersv2 import PairwiseConditioning
from boltz.model.modules.transformersv2 import DiffusionTransformer
from boltz.model.modules.utils import LinearNoBias


class GaussianSmearing(torch.nn.Module):
    """Gaussian smearing."""

    def __init__(
        self,
        start: float = 0.0,
        stop: float = 5.0,
        num_gaussians: int = 50,
    ) -> None:
        super().__init__()
        offset = torch.linspace(start, stop, num_gaussians)
        self.num_gaussians = num_gaussians
        self.coeff = -0.5 / (offset[1] - offset[0]).item() ** 2
        self.register_buffer("offset", offset)

    def forward(self, dist):
        shape = dist.shape
        dist = dist.view(-1, 1) - self.offset.view(1, -1)
        return torch.exp(self.coeff * torch.pow(dist, 2)).reshape(
            *shape, self.num_gaussians
        )
```
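`GaussianSmearing` expands raw distances into radial-basis features; note that it is defined here but not referenced by the classes below. A minimal usage sketch (illustrative values, not part of the package):

```python
import torch

# Assumes the GaussianSmearing class defined above is in scope.
smear = GaussianSmearing(start=0.0, stop=5.0, num_gaussians=50)
dist = torch.tensor([[1.2, 3.4], [0.0, 4.9]])  # distances, any shape
feat = smear(dist)                             # appends an RBF feature dim
print(feat.shape)  # torch.Size([2, 2, 50])
```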
```python
class AffinityModule(nn.Module):
    """Algorithm 31"""

    def __init__(
        self,
        token_s,
        token_z,
        pairformer_args: dict,
        transformer_args: dict,
        num_dist_bins=64,
        max_dist=22,
        use_cross_transformer: bool = False,
        groups: dict = {},
    ):
        super().__init__()
        boundaries = torch.linspace(2, max_dist, num_dist_bins - 1)
        self.register_buffer("boundaries", boundaries)
        self.dist_bin_pairwise_embed = nn.Embedding(num_dist_bins, token_z)
        init.gating_init_(self.dist_bin_pairwise_embed.weight)

        self.s_to_z_prod_in1 = LinearNoBias(token_s, token_z)
        self.s_to_z_prod_in2 = LinearNoBias(token_s, token_z)

        self.z_norm = nn.LayerNorm(token_z)
        self.z_linear = LinearNoBias(token_z, token_z)

        self.pairwise_conditioner = PairwiseConditioning(
            token_z=token_z,
            dim_token_rel_pos_feats=token_z,
            num_transitions=2,
        )

        self.pairformer_stack = PairformerNoSeqModule(token_z, **pairformer_args)
        self.affinity_heads = AffinityHeadsTransformer(
            token_z,
            transformer_args["token_s"],
            transformer_args["num_blocks"],
            transformer_args["num_heads"],
            transformer_args["activation_checkpointing"],
            False,
            groups=groups,
        )

    def forward(
        self,
        s_inputs,
        z,
        x_pred,
        feats,
        multiplicity=1,
        use_kernels=False,
    ):
        z = self.z_linear(self.z_norm(z))
        z = z.repeat_interleave(multiplicity, 0)

        z = (
            z
            + self.s_to_z_prod_in1(s_inputs)[:, :, None, :]
            + self.s_to_z_prod_in2(s_inputs)[:, None, :, :]
        )

        token_to_rep_atom = feats["token_to_rep_atom"]
        token_to_rep_atom = token_to_rep_atom.repeat_interleave(multiplicity, 0)
        if len(x_pred.shape) == 4:
            B, mult, N, _ = x_pred.shape
            x_pred = x_pred.reshape(B * mult, N, -1)
        else:
            BM, N, _ = x_pred.shape
            B = BM // multiplicity
            mult = multiplicity
        x_pred_repr = torch.bmm(token_to_rep_atom.float(), x_pred)
        d = torch.cdist(x_pred_repr, x_pred_repr)

        distogram = (d.unsqueeze(-1) > self.boundaries).sum(dim=-1).long()
        distogram = self.dist_bin_pairwise_embed(distogram)

        z = z + self.pairwise_conditioner(z_trunk=z, token_rel_pos_feats=distogram)

        pad_token_mask = feats["token_pad_mask"].repeat_interleave(multiplicity, 0)
        rec_mask = (feats["mol_type"] == 0).repeat_interleave(multiplicity, 0)
        rec_mask = rec_mask * pad_token_mask
        lig_mask = (
            feats["affinity_token_mask"]
            .repeat_interleave(multiplicity, 0)
            .to(torch.bool)
        )
        lig_mask = lig_mask * pad_token_mask
        cross_pair_mask = (
            lig_mask[:, :, None] * rec_mask[:, None, :]
            + rec_mask[:, :, None] * lig_mask[:, None, :]
            + lig_mask[:, :, None] * lig_mask[:, None, :]
        )
        z = self.pairformer_stack(
            z,
            pair_mask=cross_pair_mask,
            use_kernels=use_kernels,
        )

        out_dict = {}

        # affinity heads
        out_dict.update(
            self.affinity_heads(z=z, feats=feats, multiplicity=multiplicity)
        )

        return out_dict
```
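In `AffinityModule.forward`, each pairwise distance is bucketed by counting how many of the `num_dist_bins - 1` boundaries it exceeds, giving an index in `[0, num_dist_bins - 1]` that feeds `dist_bin_pairwise_embed`. A standalone sketch of just that binning step (sizes and distances are illustrative):

```python
import torch

num_dist_bins, max_dist = 64, 22
boundaries = torch.linspace(2, max_dist, num_dist_bins - 1)

d = torch.tensor([[0.5, 2.1], [10.0, 30.0]])  # pairwise distances
bins = (d.unsqueeze(-1) > boundaries).sum(dim=-1).long()
# Counting strictly smaller boundaries matches torch.bucketize's default semantics:
assert torch.equal(bins, torch.bucketize(d, boundaries))
print(bins)  # tensor([[ 0,  1], [25, 63]]): below 2 -> bin 0, above 22 -> bin 63
```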
```python
class AffinityHeadsTransformer(nn.Module):
    def __init__(
        self,
        token_z,
        input_token_s,
        num_blocks,
        num_heads,
        activation_checkpointing,
        use_cross_transformer,
        groups={},
    ):
        super().__init__()
        self.affinity_out_mlp = nn.Sequential(
            nn.Linear(token_z, token_z),
            nn.ReLU(),
            nn.Linear(token_z, input_token_s),
            nn.ReLU(),
        )

        self.to_affinity_pred_value = nn.Sequential(
            nn.Linear(input_token_s, input_token_s),
            nn.ReLU(),
            nn.Linear(input_token_s, input_token_s),
            nn.ReLU(),
            nn.Linear(input_token_s, 1),
        )

        self.to_affinity_pred_score = nn.Sequential(
            nn.Linear(input_token_s, input_token_s),
            nn.ReLU(),
            nn.Linear(input_token_s, input_token_s),
            nn.ReLU(),
            nn.Linear(input_token_s, 1),
        )
        self.to_affinity_logits_binary = nn.Linear(1, 1)

    def forward(
        self,
        z,
        feats,
        multiplicity=1,
    ):
        pad_token_mask = (
            feats["token_pad_mask"].repeat_interleave(multiplicity, 0).unsqueeze(-1)
        )
        rec_mask = (
            (feats["mol_type"] == 0).repeat_interleave(multiplicity, 0).unsqueeze(-1)
        )
        rec_mask = rec_mask * pad_token_mask
        lig_mask = (
            feats["affinity_token_mask"]
            .repeat_interleave(multiplicity, 0)
            .to(torch.bool)
            .unsqueeze(-1)
        ) * pad_token_mask
        cross_pair_mask = (
            lig_mask[:, :, None] * rec_mask[:, None, :]
            + rec_mask[:, :, None] * lig_mask[:, None, :]
            + (lig_mask[:, :, None] * lig_mask[:, None, :])
        ) * (
            1
            - torch.eye(lig_mask.shape[1], device=lig_mask.device)
            .unsqueeze(-1)
            .unsqueeze(0)
        )

        g = torch.sum(z * cross_pair_mask, dim=(1, 2)) / (
            torch.sum(cross_pair_mask, dim=(1, 2)) + 1e-7
        )

        g = self.affinity_out_mlp(g)

        affinity_pred_value = self.to_affinity_pred_value(g).reshape(-1, 1)
        affinity_pred_score = self.to_affinity_pred_score(g).reshape(-1, 1)
        affinity_logits_binary = self.to_affinity_logits_binary(
            affinity_pred_score
        ).reshape(-1, 1)
        out_dict = {
            "affinity_pred_value": affinity_pred_value,
            "affinity_logits_binary": affinity_logits_binary,
        }
        return out_dict
```
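`AffinityHeadsTransformer` reduces the pair representation to one vector per complex with a masked mean over ligand-receptor and off-diagonal ligand-ligand pairs. A toy sketch of that pooling step, with made-up mask contents:

```python
import torch

B, N, C = 1, 4, 8
z = torch.randn(B, N, N, C)
lig = torch.tensor([[0, 0, 1, 1.0]]).unsqueeze(-1)  # tokens 2-3: ligand
rec = torch.tensor([[1, 1, 0, 0.0]]).unsqueeze(-1)  # tokens 0-1: receptor

# Keep ligand-receptor pairs (both directions) and ligand-ligand pairs,
# zeroing the diagonal, exactly as in the forward pass above.
pair = (
    lig[:, :, None] * rec[:, None, :]
    + rec[:, :, None] * lig[:, None, :]
    + lig[:, :, None] * lig[:, None, :]
) * (1 - torch.eye(N).unsqueeze(-1).unsqueeze(0))

g = (z * pair).sum(dim=(1, 2)) / (pair.sum(dim=(1, 2)) + 1e-7)
print(g.shape)  # torch.Size([1, 8]): one pooled vector per complex
```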
boltz/model/modules/confidence.py (new file, @@ -0,0 +1,481 @@):
```python
import torch
import torch.nn.functional as F
from torch import nn

import boltz.model.layers.initialize as init
from boltz.data import const
from boltz.model.modules.confidence_utils import (
    compute_aggregated_metric,
    compute_ptms,
)
from boltz.model.modules.encoders import RelativePositionEncoder
from boltz.model.modules.trunk import (
    InputEmbedder,
    MSAModule,
    PairformerModule,
)
from boltz.model.modules.utils import LinearNoBias
```
```python
class ConfidenceModule(nn.Module):
    """Confidence module."""

    def __init__(
        self,
        token_s,
        token_z,
        pairformer_args: dict,
        num_dist_bins=64,
        max_dist=22,
        add_s_to_z_prod=False,
        add_s_input_to_s=False,
        use_s_diffusion=False,
        add_z_input_to_z=False,
        confidence_args: dict = None,
        compute_pae: bool = False,
        imitate_trunk=False,
        full_embedder_args: dict = None,
        msa_args: dict = None,
        compile_pairformer=False,
    ):
        """Initialize the confidence module.

        Parameters
        ----------
        token_s : int
            The single representation dimension.
        token_z : int
            The pair representation dimension.
        pairformer_args : dict
            The pairformer arguments.
        num_dist_bins : int, optional
            The number of distance bins, by default 64.
        max_dist : int, optional
            The maximum distance, by default 22.
        add_s_to_z_prod : bool, optional
            Whether to add the s outer product to z, by default False.
        add_s_input_to_s : bool, optional
            Whether to add the s input to s, by default False.
        use_s_diffusion : bool, optional
            Whether to use the s diffusion embedding, by default False.
        add_z_input_to_z : bool, optional
            Whether to add the z input to z, by default False.
        confidence_args : dict, optional
            The confidence arguments, by default None.
        compute_pae : bool, optional
            Whether to compute PAE, by default False.
        imitate_trunk : bool, optional
            Whether to imitate the trunk, by default False.
        full_embedder_args : dict, optional
            The full embedder arguments, by default None.
        msa_args : dict, optional
            The MSA arguments, by default None.
        compile_pairformer : bool, optional
            Whether to compile the pairformer, by default False.

        """
        super().__init__()
        self.max_num_atoms_per_token = 23
        self.no_update_s = pairformer_args.get("no_update_s", False)
        boundaries = torch.linspace(2, max_dist, num_dist_bins - 1)
        self.register_buffer("boundaries", boundaries)
        self.dist_bin_pairwise_embed = nn.Embedding(num_dist_bins, token_z)
        init.gating_init_(self.dist_bin_pairwise_embed.weight)
        s_input_dim = (
            token_s + 2 * const.num_tokens + 1 + len(const.pocket_contact_info)
        )

        self.use_s_diffusion = use_s_diffusion
        if use_s_diffusion:
            self.s_diffusion_norm = nn.LayerNorm(2 * token_s)
            self.s_diffusion_to_s = LinearNoBias(2 * token_s, token_s)
            init.gating_init_(self.s_diffusion_to_s.weight)

        self.s_to_z = LinearNoBias(s_input_dim, token_z)
        self.s_to_z_transpose = LinearNoBias(s_input_dim, token_z)
        init.gating_init_(self.s_to_z.weight)
        init.gating_init_(self.s_to_z_transpose.weight)

        self.add_s_to_z_prod = add_s_to_z_prod
        if add_s_to_z_prod:
            self.s_to_z_prod_in1 = LinearNoBias(s_input_dim, token_z)
            self.s_to_z_prod_in2 = LinearNoBias(s_input_dim, token_z)
            self.s_to_z_prod_out = LinearNoBias(token_z, token_z)
            init.gating_init_(self.s_to_z_prod_out.weight)

        self.imitate_trunk = imitate_trunk
        if self.imitate_trunk:
            s_input_dim = (
                token_s + 2 * const.num_tokens + 1 + len(const.pocket_contact_info)
            )
            self.s_init = nn.Linear(s_input_dim, token_s, bias=False)
            self.z_init_1 = nn.Linear(s_input_dim, token_z, bias=False)
            self.z_init_2 = nn.Linear(s_input_dim, token_z, bias=False)

            # Input embeddings
            self.input_embedder = InputEmbedder(**full_embedder_args)
            self.rel_pos = RelativePositionEncoder(token_z)
            self.token_bonds = nn.Linear(1, token_z, bias=False)

            # Normalization layers
            self.s_norm = nn.LayerNorm(token_s)
            self.z_norm = nn.LayerNorm(token_z)

            # Recycling projections
            self.s_recycle = nn.Linear(token_s, token_s, bias=False)
            self.z_recycle = nn.Linear(token_z, token_z, bias=False)
            init.gating_init_(self.s_recycle.weight)
            init.gating_init_(self.z_recycle.weight)

            # Pairwise stack
            self.msa_module = MSAModule(
                token_z=token_z,
                s_input_dim=s_input_dim,
                **msa_args,
            )
            self.pairformer_module = PairformerModule(
                token_s,
                token_z,
                **pairformer_args,
            )
            if compile_pairformer:
                # Big models hit the default cache limit (8)
                self.is_pairformer_compiled = True
                torch._dynamo.config.cache_size_limit = 512
                torch._dynamo.config.accumulated_cache_size_limit = 512
                self.pairformer_module = torch.compile(
                    self.pairformer_module,
                    dynamic=False,
                    fullgraph=False,
                )

            self.final_s_norm = nn.LayerNorm(token_s)
            self.final_z_norm = nn.LayerNorm(token_z)
        else:
            self.s_inputs_norm = nn.LayerNorm(s_input_dim)
            if not self.no_update_s:
                self.s_norm = nn.LayerNorm(token_s)
            self.z_norm = nn.LayerNorm(token_z)

            self.add_s_input_to_s = add_s_input_to_s
            if add_s_input_to_s:
                self.s_input_to_s = LinearNoBias(s_input_dim, token_s)
                init.gating_init_(self.s_input_to_s.weight)

            self.add_z_input_to_z = add_z_input_to_z
            if add_z_input_to_z:
                self.rel_pos = RelativePositionEncoder(token_z)
                self.token_bonds = nn.Linear(1, token_z, bias=False)

            self.pairformer_stack = PairformerModule(
                token_s,
                token_z,
                **pairformer_args,
            )

        self.confidence_heads = ConfidenceHeads(
            token_s,
            token_z,
            compute_pae=compute_pae,
            **confidence_args,
        )

    def forward(
        self,
        s_inputs,
        s,
        z,
        x_pred,
        feats,
        pred_distogram_logits,
        multiplicity=1,
        s_diffusion=None,
        run_sequentially=False,
        use_kernels: bool = False,
    ):
        if run_sequentially and multiplicity > 1:
            assert z.shape[0] == 1, "Not supported with batch size > 1"
            out_dicts = []
            for sample_idx in range(multiplicity):
                out_dicts.append(  # noqa: PERF401
                    self.forward(
                        s_inputs,
                        s,
                        z,
                        x_pred[sample_idx : sample_idx + 1],
                        feats,
                        pred_distogram_logits,
                        multiplicity=1,
                        s_diffusion=s_diffusion[sample_idx : sample_idx + 1]
                        if s_diffusion is not None
                        else None,
                        run_sequentially=False,
                        use_kernels=use_kernels,
                    )
                )

            out_dict = {}
            for key in out_dicts[0]:
                if key != "pair_chains_iptm":
                    out_dict[key] = torch.cat([out[key] for out in out_dicts], dim=0)
                else:
                    pair_chains_iptm = {}
                    for chain_idx1 in out_dicts[0][key].keys():
                        chains_iptm = {}
                        for chain_idx2 in out_dicts[0][key][chain_idx1].keys():
                            chains_iptm[chain_idx2] = torch.cat(
                                [out[key][chain_idx1][chain_idx2] for out in out_dicts],
                                dim=0,
                            )
                        pair_chains_iptm[chain_idx1] = chains_iptm
                    out_dict[key] = pair_chains_iptm
            return out_dict

        if self.imitate_trunk:
            s_inputs = self.input_embedder(feats)

            # Initialize the sequence and pairwise embeddings
            s_init = self.s_init(s_inputs)
            z_init = (
                self.z_init_1(s_inputs)[:, :, None]
                + self.z_init_2(s_inputs)[:, None, :]
            )
            relative_position_encoding = self.rel_pos(feats)
            z_init = z_init + relative_position_encoding
            z_init = z_init + self.token_bonds(feats["token_bonds"].float())

            # Apply recycling
            s = s_init + self.s_recycle(self.s_norm(s))
            z = z_init + self.z_recycle(self.z_norm(z))

        else:
            s_inputs = self.s_inputs_norm(s_inputs).repeat_interleave(multiplicity, 0)
            if not self.no_update_s:
                s = self.s_norm(s)

            if self.add_s_input_to_s:
                s = s + self.s_input_to_s(s_inputs)

            z = self.z_norm(z)

            if self.add_z_input_to_z:
                relative_position_encoding = self.rel_pos(feats)
                z = z + relative_position_encoding
                z = z + self.token_bonds(feats["token_bonds"].float())

        s = s.repeat_interleave(multiplicity, 0)

        if self.use_s_diffusion:
            assert s_diffusion is not None
            s_diffusion = self.s_diffusion_norm(s_diffusion)
            s = s + self.s_diffusion_to_s(s_diffusion)

        z = z.repeat_interleave(multiplicity, 0)
        z = (
            z
            + self.s_to_z(s_inputs)[:, :, None, :]
            + self.s_to_z_transpose(s_inputs)[:, None, :, :]
        )

        if self.add_s_to_z_prod:
            z = z + self.s_to_z_prod_out(
                self.s_to_z_prod_in1(s_inputs)[:, :, None, :]
                * self.s_to_z_prod_in2(s_inputs)[:, None, :, :]
            )

        token_to_rep_atom = feats["token_to_rep_atom"]
        token_to_rep_atom = token_to_rep_atom.repeat_interleave(multiplicity, 0)
        if len(x_pred.shape) == 4:
            B, mult, N, _ = x_pred.shape
            x_pred = x_pred.reshape(B * mult, N, -1)
        x_pred_repr = torch.bmm(token_to_rep_atom.float(), x_pred)
        d = torch.cdist(x_pred_repr, x_pred_repr)

        distogram = (d.unsqueeze(-1) > self.boundaries).sum(dim=-1).long()
        distogram = self.dist_bin_pairwise_embed(distogram)

        z = z + distogram

        mask = feats["token_pad_mask"].repeat_interleave(multiplicity, 0)
        pair_mask = mask[:, :, None] * mask[:, None, :]

        if self.imitate_trunk:
            z = z + self.msa_module(z, s_inputs, feats, use_kernels=use_kernels)

            s, z = self.pairformer_module(
                s, z, mask=mask, pair_mask=pair_mask, use_kernels=use_kernels
            )

            s, z = self.final_s_norm(s), self.final_z_norm(z)

        else:
            s_t, z_t = self.pairformer_stack(
                s, z, mask=mask, pair_mask=pair_mask, use_kernels=use_kernels
            )

            # AF3 has residual connections; we remove them
            s = s_t
            z = z_t

        out_dict = {}

        # confidence heads
        out_dict.update(
            self.confidence_heads(
                s=s,
                z=z,
                x_pred=x_pred,
                d=d,
                feats=feats,
                multiplicity=multiplicity,
                pred_distogram_logits=pred_distogram_logits,
            )
        )

        return out_dict
```
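Throughout `ConfidenceModule.forward`, trunk tensors are expanded with `repeat_interleave(multiplicity, 0)` so that a batch of B trunk embeddings lines up with B * multiplicity predicted structures. A small shape sketch of that alignment (dimensions are illustrative):

```python
import torch

B, N, token_z, multiplicity = 2, 5, 16, 3
z = torch.randn(B, N, N, token_z)            # one pair rep per input complex
x_pred = torch.randn(B, multiplicity, N, 3)  # several diffusion samples each

z = z.repeat_interleave(multiplicity, 0)     # -> (B * multiplicity, N, N, token_z)
x_pred = x_pred.reshape(B * multiplicity, N, -1)
print(z.shape[0] == x_pred.shape[0])         # True: sample i aligns with trunk copy i
```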
```python
class ConfidenceHeads(nn.Module):
    """Confidence heads."""

    def __init__(
        self,
        token_s,
        token_z,
        num_plddt_bins=50,
        num_pde_bins=64,
        num_pae_bins=64,
        compute_pae: bool = True,
    ):
        """Initialize the confidence heads.

        Parameters
        ----------
        token_s : int
            The single representation dimension.
        token_z : int
            The pair representation dimension.
        num_plddt_bins : int, optional
            The number of pLDDT bins, by default 50.
        num_pde_bins : int, optional
            The number of PDE bins, by default 64.
        num_pae_bins : int, optional
            The number of PAE bins, by default 64.
        compute_pae : bool, optional
            Whether to compute PAE, by default True.

        """
        super().__init__()
        self.max_num_atoms_per_token = 23
        self.to_pde_logits = LinearNoBias(token_z, num_pde_bins)
        self.to_plddt_logits = LinearNoBias(token_s, num_plddt_bins)
        self.to_resolved_logits = LinearNoBias(token_s, 2)
        self.compute_pae = compute_pae
        if self.compute_pae:
            self.to_pae_logits = LinearNoBias(token_z, num_pae_bins)

    def forward(
        self,
        s,
        z,
        x_pred,
        d,
        feats,
        pred_distogram_logits,
        multiplicity=1,
    ):
        # Compute the pLDDT, PDE, PAE, and resolved logits
        plddt_logits = self.to_plddt_logits(s)
        pde_logits = self.to_pde_logits(z + z.transpose(1, 2))
        resolved_logits = self.to_resolved_logits(s)
        if self.compute_pae:
            pae_logits = self.to_pae_logits(z)

        # Weights used to compute the interface pLDDT
        ligand_weight = 2
        interface_weight = 1

        # Retrieve relevant features
        token_type = feats["mol_type"]
        token_type = token_type.repeat_interleave(multiplicity, 0)
        is_ligand_token = (token_type == const.chain_type_ids["NONPOLYMER"]).float()

        # Compute the aggregated pLDDT and ipLDDT
        plddt = compute_aggregated_metric(plddt_logits)
        token_pad_mask = feats["token_pad_mask"].repeat_interleave(multiplicity, 0)
        complex_plddt = (plddt * token_pad_mask).sum(dim=-1) / token_pad_mask.sum(
            dim=-1
        )

        is_contact = (d < 8).float()
        is_different_chain = (
            feats["asym_id"].unsqueeze(-1) != feats["asym_id"].unsqueeze(-2)
        ).float()
        is_different_chain = is_different_chain.repeat_interleave(multiplicity, 0)
        token_interface_mask = torch.max(
            is_contact * is_different_chain * (1 - is_ligand_token).unsqueeze(-1),
            dim=-1,
        ).values
        iplddt_weight = (
            is_ligand_token * ligand_weight + token_interface_mask * interface_weight
        )
        complex_iplddt = (plddt * token_pad_mask * iplddt_weight).sum(dim=-1) / (
            torch.sum(token_pad_mask * iplddt_weight, dim=-1) + 1e-5
        )

        # Compute the aggregated PDE and iPDE
        pde = compute_aggregated_metric(pde_logits, end=32)
        pred_distogram_prob = nn.functional.softmax(
            pred_distogram_logits, dim=-1
        ).repeat_interleave(multiplicity, 0)
        contacts = torch.zeros((1, 1, 1, 64), dtype=pred_distogram_prob.dtype).to(
            pred_distogram_prob.device
        )
        contacts[:, :, :, :20] = 1.0
        prob_contact = (pred_distogram_prob * contacts).sum(-1)
        token_pad_mask = feats["token_pad_mask"].repeat_interleave(multiplicity, 0)
        token_pad_pair_mask = (
            token_pad_mask.unsqueeze(-1)
            * token_pad_mask.unsqueeze(-2)
            * (
                1
                - torch.eye(
                    token_pad_mask.shape[1], device=token_pad_mask.device
                ).unsqueeze(0)
            )
        )
        token_pair_mask = token_pad_pair_mask * prob_contact
        complex_pde = (pde * token_pair_mask).sum(dim=(1, 2)) / token_pair_mask.sum(
            dim=(1, 2)
        )
        asym_id = feats["asym_id"].repeat_interleave(multiplicity, 0)
        token_interface_pair_mask = token_pair_mask * (
            asym_id.unsqueeze(-1) != asym_id.unsqueeze(-2)
        )
        complex_ipde = (pde * token_interface_pair_mask).sum(dim=(1, 2)) / (
            token_interface_pair_mask.sum(dim=(1, 2)) + 1e-5
        )

        out_dict = dict(
            pde_logits=pde_logits,
            plddt_logits=plddt_logits,
            resolved_logits=resolved_logits,
            pde=pde,
            plddt=plddt,
            complex_plddt=complex_plddt,
            complex_iplddt=complex_iplddt,
            complex_pde=complex_pde,
            complex_ipde=complex_ipde,
        )
        if self.compute_pae:
            out_dict["pae_logits"] = pae_logits
            out_dict["pae"] = compute_aggregated_metric(pae_logits, end=32)
            ptm, iptm, ligand_iptm, protein_iptm, pair_chains_iptm = compute_ptms(
                pae_logits, x_pred, feats, multiplicity
            )
            out_dict["ptm"] = ptm
            out_dict["iptm"] = iptm
            out_dict["ligand_iptm"] = ligand_iptm
            out_dict["protein_iptm"] = protein_iptm
            out_dict["pair_chains_iptm"] = pair_chains_iptm

        return out_dict
```
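`compute_aggregated_metric` (imported from `boltz.model.modules.confidence_utils`, which is not shown in this diff) collapses binned logits into a scalar per token or pair. A plausible stand-in, assuming an expectation over evenly spaced bin centers on `[0, end]`; the packaged helper may differ in detail:

```python
import torch

def aggregated_metric_sketch(logits: torch.Tensor, end: float = 1.0) -> torch.Tensor:
    """Hypothetical stand-in for compute_aggregated_metric: expectation
    over evenly spaced bin centers on [0, end]."""
    num_bins = logits.shape[-1]
    width = end / num_bins
    centers = width / 2 + width * torch.arange(
        num_bins, dtype=logits.dtype, device=logits.device
    )
    return (torch.softmax(logits, dim=-1) * centers).sum(dim=-1)

plddt = aggregated_metric_sketch(torch.randn(1, 10, 50))            # per-token, in (0, 1)
pde = aggregated_metric_sketch(torch.randn(1, 10, 10, 64), end=32)  # per-pair, in Angstroms
```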