rc-foundry 0.1.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (180) hide show
  1. foundry/__init__.py +57 -0
  2. foundry/callbacks/__init__.py +5 -0
  3. foundry/callbacks/callback.py +116 -0
  4. foundry/callbacks/health_logging.py +419 -0
  5. foundry/callbacks/metrics_logging.py +211 -0
  6. foundry/callbacks/timing_logging.py +67 -0
  7. foundry/callbacks/train_logging.py +278 -0
  8. foundry/common.py +108 -0
  9. foundry/constants.py +28 -0
  10. foundry/hydra/resolvers.py +77 -0
  11. foundry/inference_engines/base.py +235 -0
  12. foundry/inference_engines/checkpoint_registry.py +66 -0
  13. foundry/metrics/__init__.py +12 -0
  14. foundry/metrics/losses.py +30 -0
  15. foundry/metrics/metric.py +319 -0
  16. foundry/model/layers/blocks.py +47 -0
  17. foundry/testing/__init__.py +6 -0
  18. foundry/testing/fixtures.py +19 -0
  19. foundry/testing/pytest_hooks.py +15 -0
  20. foundry/trainers/fabric.py +923 -0
  21. foundry/training/EMA.py +67 -0
  22. foundry/training/checkpoint.py +61 -0
  23. foundry/training/schedulers.py +91 -0
  24. foundry/utils/alignment.py +86 -0
  25. foundry/utils/components.py +415 -0
  26. foundry/utils/datasets.py +405 -0
  27. foundry/utils/ddp.py +103 -0
  28. foundry/utils/instantiators.py +72 -0
  29. foundry/utils/logging.py +279 -0
  30. foundry/utils/rigid.py +1460 -0
  31. foundry/utils/rotation_augmentation.py +65 -0
  32. foundry/utils/squashfs.py +172 -0
  33. foundry/utils/torch.py +317 -0
  34. foundry/utils/weights.py +271 -0
  35. foundry/version.py +34 -0
  36. foundry_cli/__init__.py +3 -0
  37. foundry_cli/download_checkpoints.py +281 -0
  38. mpnn/__init__.py +1 -0
  39. mpnn/collate/feature_collator.py +265 -0
  40. mpnn/inference.py +53 -0
  41. mpnn/inference_engines/mpnn.py +549 -0
  42. mpnn/loss/nll_loss.py +122 -0
  43. mpnn/metrics/nll.py +369 -0
  44. mpnn/metrics/sequence_recovery.py +440 -0
  45. mpnn/model/layers/graph_embeddings.py +2372 -0
  46. mpnn/model/layers/message_passing.py +332 -0
  47. mpnn/model/layers/position_wise_feed_forward.py +44 -0
  48. mpnn/model/layers/positional_encoding.py +98 -0
  49. mpnn/model/mpnn.py +2632 -0
  50. mpnn/pipelines/mpnn.py +162 -0
  51. mpnn/samplers/samplers.py +167 -0
  52. mpnn/train.py +341 -0
  53. mpnn/trainers/mpnn.py +193 -0
  54. mpnn/transforms/feature_aggregation/mpnn.py +184 -0
  55. mpnn/transforms/feature_aggregation/polymer_ligand_interface.py +76 -0
  56. mpnn/transforms/feature_aggregation/token_encodings.py +132 -0
  57. mpnn/transforms/feature_aggregation/user_settings.py +347 -0
  58. mpnn/transforms/polymer_ligand_interface.py +164 -0
  59. mpnn/utils/inference.py +2397 -0
  60. mpnn/utils/probability.py +37 -0
  61. mpnn/utils/weights.py +309 -0
  62. rc_foundry-0.1.1.dist-info/METADATA +239 -0
  63. rc_foundry-0.1.1.dist-info/RECORD +180 -0
  64. rc_foundry-0.1.1.dist-info/WHEEL +4 -0
  65. rc_foundry-0.1.1.dist-info/entry_points.txt +5 -0
  66. rc_foundry-0.1.1.dist-info/licenses/LICENSE.md +28 -0
  67. rf3/__init__.py +3 -0
  68. rf3/_version.py +33 -0
  69. rf3/alignment.py +79 -0
  70. rf3/callbacks/dump_validation_structures.py +101 -0
  71. rf3/callbacks/metrics_logging.py +324 -0
  72. rf3/chemical.py +1529 -0
  73. rf3/cli.py +77 -0
  74. rf3/data/cyclic_transform.py +78 -0
  75. rf3/data/extra_xforms.py +36 -0
  76. rf3/data/ground_truth_template.py +463 -0
  77. rf3/data/paired_msa.py +206 -0
  78. rf3/data/pipeline_utils.py +128 -0
  79. rf3/data/pipelines.py +558 -0
  80. rf3/diffusion_samplers/inference_sampler.py +222 -0
  81. rf3/inference.py +65 -0
  82. rf3/inference_engines/__init__.py +5 -0
  83. rf3/inference_engines/rf3.py +735 -0
  84. rf3/kinematics.py +354 -0
  85. rf3/loss/af3_confidence_loss.py +515 -0
  86. rf3/loss/af3_losses.py +655 -0
  87. rf3/loss/loss.py +179 -0
  88. rf3/metrics/chiral.py +179 -0
  89. rf3/metrics/clashing_chains.py +68 -0
  90. rf3/metrics/distogram.py +421 -0
  91. rf3/metrics/lddt.py +523 -0
  92. rf3/metrics/metadata.py +43 -0
  93. rf3/metrics/metric_utils.py +192 -0
  94. rf3/metrics/predicted_error.py +134 -0
  95. rf3/metrics/rasa.py +108 -0
  96. rf3/metrics/selected_distances.py +91 -0
  97. rf3/model/RF3.py +527 -0
  98. rf3/model/RF3_blocks.py +92 -0
  99. rf3/model/RF3_structure.py +303 -0
  100. rf3/model/layers/af3_auxiliary_heads.py +255 -0
  101. rf3/model/layers/af3_diffusion_transformer.py +544 -0
  102. rf3/model/layers/attention.py +313 -0
  103. rf3/model/layers/layer_utils.py +127 -0
  104. rf3/model/layers/mlff.py +118 -0
  105. rf3/model/layers/outer_product.py +59 -0
  106. rf3/model/layers/pairformer_layers.py +783 -0
  107. rf3/model/layers/structure_bias.py +56 -0
  108. rf3/scoring.py +1787 -0
  109. rf3/symmetry/resolve.py +284 -0
  110. rf3/train.py +194 -0
  111. rf3/trainers/rf3.py +570 -0
  112. rf3/util_module.py +47 -0
  113. rf3/utils/frames.py +109 -0
  114. rf3/utils/inference.py +665 -0
  115. rf3/utils/io.py +198 -0
  116. rf3/utils/loss.py +72 -0
  117. rf3/utils/predict_and_score.py +165 -0
  118. rf3/utils/predicted_error.py +673 -0
  119. rf3/utils/recycling.py +42 -0
  120. rf3/validate.py +140 -0
  121. rfd3/.gitignore +7 -0
  122. rfd3/Makefile +76 -0
  123. rfd3/__init__.py +12 -0
  124. rfd3/callbacks.py +66 -0
  125. rfd3/cli.py +41 -0
  126. rfd3/constants.py +212 -0
  127. rfd3/engine.py +543 -0
  128. rfd3/inference/datasets.py +193 -0
  129. rfd3/inference/input_parsing.py +1123 -0
  130. rfd3/inference/legacy_input_parsing.py +717 -0
  131. rfd3/inference/parsing.py +165 -0
  132. rfd3/inference/symmetry/atom_array.py +298 -0
  133. rfd3/inference/symmetry/checks.py +241 -0
  134. rfd3/inference/symmetry/contigs.py +63 -0
  135. rfd3/inference/symmetry/frames.py +355 -0
  136. rfd3/inference/symmetry/symmetry_utils.py +398 -0
  137. rfd3/metrics/design_metrics.py +465 -0
  138. rfd3/metrics/hbonds_hbplus_metrics.py +308 -0
  139. rfd3/metrics/hbonds_metrics.py +389 -0
  140. rfd3/metrics/losses.py +325 -0
  141. rfd3/metrics/metrics_utils.py +118 -0
  142. rfd3/metrics/sidechain_metrics.py +349 -0
  143. rfd3/model/RFD3.py +105 -0
  144. rfd3/model/RFD3_diffusion_module.py +387 -0
  145. rfd3/model/cfg_utils.py +81 -0
  146. rfd3/model/inference_sampler.py +635 -0
  147. rfd3/model/layers/attention.py +577 -0
  148. rfd3/model/layers/block_utils.py +580 -0
  149. rfd3/model/layers/blocks.py +777 -0
  150. rfd3/model/layers/chunked_pairwise.py +377 -0
  151. rfd3/model/layers/encoders.py +417 -0
  152. rfd3/model/layers/layer_utils.py +197 -0
  153. rfd3/model/layers/pairformer_layers.py +128 -0
  154. rfd3/run_inference.py +45 -0
  155. rfd3/testing/debug.py +139 -0
  156. rfd3/testing/debug_utils.py +73 -0
  157. rfd3/testing/testing_utils.py +356 -0
  158. rfd3/train.py +194 -0
  159. rfd3/trainer/dump_validation_structures.py +154 -0
  160. rfd3/trainer/fabric_trainer.py +923 -0
  161. rfd3/trainer/recycling.py +42 -0
  162. rfd3/trainer/rfd3.py +485 -0
  163. rfd3/trainer/trainer_utils.py +502 -0
  164. rfd3/transforms/conditioning_base.py +508 -0
  165. rfd3/transforms/conditioning_utils.py +200 -0
  166. rfd3/transforms/design_transforms.py +807 -0
  167. rfd3/transforms/dna_crop.py +523 -0
  168. rfd3/transforms/hbonds.py +407 -0
  169. rfd3/transforms/hbonds_hbplus.py +246 -0
  170. rfd3/transforms/ncaa_transforms.py +153 -0
  171. rfd3/transforms/pipelines.py +632 -0
  172. rfd3/transforms/ppi_transforms.py +541 -0
  173. rfd3/transforms/rasa.py +116 -0
  174. rfd3/transforms/symmetry.py +76 -0
  175. rfd3/transforms/training_conditions.py +552 -0
  176. rfd3/transforms/util_transforms.py +498 -0
  177. rfd3/transforms/virtual_atoms.py +305 -0
  178. rfd3/utils/inference.py +648 -0
  179. rfd3/utils/io.py +245 -0
  180. rfd3/utils/vizualize.py +276 -0
@@ -0,0 +1,673 @@
1
+ import itertools
2
+ from typing import List
3
+
4
+ import einops
5
+ import numpy as np
6
+ import pandas as pd
7
+ import torch
8
+ import tree
9
+ from beartype.typing import Any
10
+ from biotite.structure import AtomArray, AtomArrayStack
11
+ from omegaconf import DictConfig
12
+ from rf3.chemical import NHEAVY
13
+ from rf3.metrics.metric_utils import (
14
+ compute_mean_over_subsampled_pairs,
15
+ compute_min_over_subsampled_pairs,
16
+ create_chainwise_masks_1d,
17
+ create_chainwise_masks_2d,
18
+ create_interface_masks_2d,
19
+ spread_batch_into_dictionary,
20
+ unbin_logits,
21
+ )
22
+
23
+
24
def get_mean_atomwise_plddt(
    plddt_logits: torch.Tensor,
    is_real_atom: torch.Tensor,
    max_value: float,
) -> torch.Tensor:
    """Aggregate per-atom pLDDT logits into a single mean pLDDT per batch element.

    The flattened (atom-slot x bin) logit dimension is split apart, the logits
    are unbinned into scalar pLDDT values, and the mean is taken over all real
    (non-padding) atoms.

    Args:
        plddt_logits: Tensor of shape [B, n_token, max_atoms_in_a_token * n_bin] with logits
        is_real_atom: Boolean mask indicating which atoms are real (i.e., not padding).
            NOTE(review): previously documented as [B, n_token, max_atoms_in_a_token],
            but the masking below (`[:, :max_atoms_in_a_token].unsqueeze(0)`) only lines
            up if this is a 2D [n_token, n_atom_slots] mask whose slot axis is sliced to
            the heavy-atom count — confirm the caller's shape.
        max_value: Maximum value for pLDDT (assigned to the last bin)

    Returns:
        plddt: Tensor of shape [B,] with the mean atom-wise pLDDT for each batch
    """
    assert (
        plddt_logits.ndim == 3
    ), "plddt_logits must be a 3D tensor (B, n_token, max_atoms_in_a_token * n_bins)"

    # TODO: Replace with the last dimension of is_real_atom; right now that number is too large (36) because it includes hydrogens
    max_atoms_in_a_token = NHEAVY

    # Since the pLDDT logits have the last dimension (max_atoms_in_a_token * n_bins), we can calculate n_bins directly
    assert (
        plddt_logits.shape[-1] % max_atoms_in_a_token == 0
    ), "The last dimension of plddt_logits must be divisible by max_atoms_in_a_token!"
    n_bins = plddt_logits.shape[-1] // max_atoms_in_a_token

    # ... reshape to match what unbin_logits expects:
    # [..., n_token, n_bins * max_atoms_in_a_token] -> [..., n_bins, n_token, max_atoms_in_a_token]
    reshaped_plddt_logits = einops.rearrange(
        plddt_logits,
        "... n_token (max_atoms_in_a_token n_bins) -> ... n_bins n_token max_atoms_in_a_token",
        max_atoms_in_a_token=max_atoms_in_a_token,
        n_bins=n_bins,
    ).float()

    # Convert the binned logits into scalar pLDDT values (expected value over bins)
    plddt = unbin_logits(
        reshaped_plddt_logits,
        max_value,
        n_bins,
    )

    # Ensure the mask lives on the same device as the unbinned values
    is_real_atom = is_real_atom.to(device=plddt.device)

    # ... create mask indicating which atoms are "real" (i.e., not padding) and calculate the mean
    mask = is_real_atom[:, :max_atoms_in_a_token].unsqueeze(0)
    atomwise_plddt_mean = (plddt * mask).sum(dim=(1, 2)) / mask.sum(dim=(1, 2))

    return atomwise_plddt_mean
73
+
74
+
75
def compile_af3_confidence_outputs(
    plddt_logits: torch.Tensor,
    pae_logits: torch.Tensor,
    pde_logits: torch.Tensor,
    chain_iid_token_lvl: torch.Tensor,
    is_real_atom: torch.Tensor,
    example_id: str,
    confidence_loss_cfg: DictConfig | dict,
) -> dict[str, Any]:
    """Given the confidence logits, computes the confidence metrics for the model's predictions.

    Args:
        plddt_logits: pLDDT logits of shape [B, n_token, NHEAVY * n_bins].
        pae_logits: pAE logits with the bin dimension last (permuted to (B, n_bins, ...) below).
        pde_logits: pDE logits with the bin dimension last.
        chain_iid_token_lvl: Per-token chain identifiers used to build chain/interface masks.
        is_real_atom: Boolean mask of real (non-padding) atoms; only the first NHEAVY
            atom slots are used.
        example_id: Identifier copied into every output row.
        confidence_loss_cfg: Config holding plddt/pae/pde sub-configs, each with
            max_value and n_bins. Accessed via attributes, so a plain dict must
            support attribute access (e.g. an OmegaConf DictConfig).

    Returns:
        dict[str, Any]: A dictionary containing the following:
            - confidence_df: A DataFrame containing the aggregate confidence metrics at the chain- and interface-level
            - plddt: The unbinned pLDDT values
            - pae: The unbinned pAE values
            - pde: The unbinned pDE values
    """
    # TODO: Refactor to accept an AtomArray
    # TODO: Taking the confidence_loss_cfg does not align with functional programming
    # best-practices; we should instead take the max_value and n_bins as arguments

    # Reorder the input tensors to be in (B, n_bins, ...) format for unbinning
    plddt = unbin_logits(
        plddt_logits.reshape(
            -1,
            plddt_logits.shape[1],
            NHEAVY,
            confidence_loss_cfg.plddt.n_bins,
        )
        .permute(0, 3, 1, 2)
        .float(),
        confidence_loss_cfg.plddt.max_value,
        confidence_loss_cfg.plddt.n_bins,
    )

    # Unbin the pae and pde logits
    pae = unbin_logits(
        pae_logits.permute(0, 3, 1, 2).float(),
        confidence_loss_cfg.pae.max_value,
        confidence_loss_cfg.pae.n_bins,
    )
    pde = unbin_logits(
        pde_logits.permute(0, 3, 1, 2).float(),
        confidence_loss_cfg.pde.max_value,
        confidence_loss_cfg.pde.n_bins,
    )

    # Calculate interface metrics (mean/min over inter-chain token pairs)
    interface_masks = create_interface_masks_2d(chain_iid_token_lvl, device=pae.device)
    pae_interface = {
        k: spread_batch_into_dictionary(compute_mean_over_subsampled_pairs(pae, v))
        for k, v in interface_masks.items()
    }
    pde_interface = {
        k: spread_batch_into_dictionary(compute_mean_over_subsampled_pairs(pde, v))
        for k, v in interface_masks.items()
    }

    pae_interface_min = {
        k: spread_batch_into_dictionary(compute_min_over_subsampled_pairs(pae, v))
        for k, v in interface_masks.items()
    }

    pde_interface_min = {
        k: spread_batch_into_dictionary(compute_min_over_subsampled_pairs(pde, v))
        for k, v in interface_masks.items()
    }

    # Calculate chainwise metrics (intra-chain token pairs)
    chain_masks_2d = create_chainwise_masks_2d(chain_iid_token_lvl, device=pae.device)
    pae_chainwise = {
        k: spread_batch_into_dictionary(compute_mean_over_subsampled_pairs(pae, v))
        for k, v in chain_masks_2d.items()
    }
    pde_chainwise = {
        k: spread_batch_into_dictionary(compute_mean_over_subsampled_pairs(pde, v))
        for k, v in chain_masks_2d.items()
    }

    # pLDDT is per-atom, so combine the 1D chain mask with the real-atom mask
    chain_masks_1d = create_chainwise_masks_1d(
        chain_iid_token_lvl, device=is_real_atom.device
    )
    plddt_chainwise = {
        k: spread_batch_into_dictionary(
            compute_mean_over_subsampled_pairs(
                plddt, is_real_atom[..., :NHEAVY] * v[:, None]
            )
        )
        for k, v in chain_masks_1d.items()
    }

    # Aggregate confidence data
    confidence_data = {
        "example_id": example_id,
        "mean_plddt": spread_batch_into_dictionary(
            compute_mean_over_subsampled_pairs(plddt, is_real_atom[..., :NHEAVY])
        ),
        "mean_pae": spread_batch_into_dictionary(pae.mean(dim=(-1, -2))),
        "mean_pde": spread_batch_into_dictionary(pde.mean(dim=(-1, -2))),
        "chain_wise_mean_plddt": plddt_chainwise,
        "chain_wise_mean_pae": pae_chainwise,
        "chain_wise_mean_pde": pde_chainwise,
        "interface_wise_mean_pae": pae_interface,
        "interface_wise_mean_pde": pde_interface,
        "interface_wise_min_pae": pae_interface_min,
        "interface_wise_min_pde": pde_interface_min,
    }

    # Generate DataFrame rows
    num_batches = plddt.shape[0]
    chains = np.unique(chain_iid_token_lvl)
    chain_pairs = list(itertools.combinations(chains, 2))

    # For every batch, chain, and interface (chain pair), generate a dataframe row
    chain_rows = [
        {
            "example_id": example_id,
            "chain_chainwise": chain,
            "chainwise_plddt": confidence_data["chain_wise_mean_plddt"][chain][
                batch_idx
            ],
            "chainwise_pde": confidence_data["chain_wise_mean_pde"][chain][batch_idx],
            "chainwise_pae": confidence_data["chain_wise_mean_pae"][chain][batch_idx],
            "overall_plddt": confidence_data["mean_plddt"][batch_idx],
            "overall_pde": confidence_data["mean_pde"][batch_idx],
            "overall_pae": confidence_data["mean_pae"][batch_idx],
            "batch_idx": batch_idx,
        }
        for batch_idx in range(num_batches)
        for chain in chains
    ]

    interface_rows = [
        {
            "example_id": example_id,
            "chain_i_interface": chain_i,
            "chain_j_interface": chain_j,
            "pae_interface": confidence_data["interface_wise_mean_pae"][
                (chain_i, chain_j)
            ][batch_idx],
            "pde_interface": confidence_data["interface_wise_mean_pde"][
                (chain_i, chain_j)
            ][batch_idx],
            "min_pae_interface": confidence_data["interface_wise_min_pae"][
                (chain_i, chain_j)
            ][batch_idx],
            "min_pde_interface": confidence_data["interface_wise_min_pde"][
                (chain_i, chain_j)
            ][batch_idx],
            "overall_plddt": confidence_data["mean_plddt"][batch_idx],
            "overall_pde": confidence_data["mean_pde"][batch_idx],
            "overall_pae": confidence_data["mean_pae"][batch_idx],
            "batch_idx": batch_idx,
        }
        for batch_idx in range(num_batches)
        for (chain_i, chain_j) in chain_pairs
    ]

    return {
        # FIX: was pd.DataFrame(itertools.chain([*rows...])) — wrapping an
        # already-materialized list in chain() is a no-op; pass the list directly.
        "confidence_df": pd.DataFrame([*chain_rows, *interface_rows]),
        "plddt": plddt,
        "pae": pae,
        "pde": pde,
    }
239
+
240
+
241
def compile_af3_style_confidence_outputs(
    plddt_logits: torch.Tensor,
    pae_logits: torch.Tensor,
    pde_logits: torch.Tensor,
    chain_iid_token_lvl: torch.Tensor | np.ndarray,
    is_real_atom: torch.Tensor,
    atom_array: AtomArray,
    confidence_loss_cfg: DictConfig | dict,
    batch_idx: int = 0,
) -> dict[str, Any]:
    """Compile confidence outputs in AlphaFold3-compatible format.

    Args:
        plddt_logits: pLDDT logits of shape [B, n_token, NHEAVY * n_bins].
        pae_logits: pAE logits with the bin dimension last.
        pde_logits: pDE logits with the bin dimension last.
        chain_iid_token_lvl: Per-token chain identifiers (moved to numpy if a tensor).
        is_real_atom: Boolean mask of real atoms; only the first NHEAVY slots are used.
        atom_array: Structure whose chain_id annotation supplies per-atom chain ids.
        confidence_loss_cfg: Config with plddt/pae/pde sub-configs (max_value, n_bins),
            accessed via attributes.
        batch_idx: Which diffusion-batch element to summarize (default 0).

    Returns a dict with:
        - summary_confidences: Dict for {name}_summary_confidences.json
        - confidences: Dict for {name}_confidences.json (per-atom data)
        - plddt, pae, pde: Raw tensors for further processing
    """
    # Unbin logits into scalar values, with bins moved to dim 1 as unbin_logits expects
    plddt = unbin_logits(
        plddt_logits.reshape(
            -1,
            plddt_logits.shape[1],
            NHEAVY,
            confidence_loss_cfg.plddt.n_bins,
        )
        .permute(0, 3, 1, 2)
        .float(),
        confidence_loss_cfg.plddt.max_value,
        confidence_loss_cfg.plddt.n_bins,
    )

    pae = unbin_logits(
        pae_logits.permute(0, 3, 1, 2).float(),
        confidence_loss_cfg.pae.max_value,
        confidence_loss_cfg.pae.n_bins,
    )
    pde = unbin_logits(
        pde_logits.permute(0, 3, 1, 2).float(),
        confidence_loss_cfg.pde.max_value,
        confidence_loss_cfg.pde.n_bins,
    )

    # Get chain information
    if isinstance(chain_iid_token_lvl, torch.Tensor):
        chain_iid_token_lvl = chain_iid_token_lvl.cpu().numpy()
    chains = list(np.unique(chain_iid_token_lvl))
    n_chains = len(chains)

    # Calculate chainwise metrics
    chain_masks_1d = create_chainwise_masks_1d(
        chain_iid_token_lvl, device=is_real_atom.device
    )

    # Chain-level pLDDT (mean over that chain's real atoms)
    chain_plddt = {}
    for chain, mask in chain_masks_1d.items():
        chain_plddt[chain] = compute_mean_over_subsampled_pairs(
            plddt, is_real_atom[..., :NHEAVY] * mask[:, None]
        )[batch_idx].item()

    # FIX: removed a dead intra-chain PAE computation (`chain_pae` built from
    # create_chainwise_masks_2d) — its result was never used in any output.

    # Chain-pair PAE/PDE (inter-chain, for iptm-like metric)
    interface_masks = create_interface_masks_2d(chain_iid_token_lvl, device=pae.device)
    chain_pair_pae = {}
    chain_pair_pae_min = {}
    chain_pair_pde = {}
    chain_pair_pde_min = {}
    for (chain_i, chain_j), mask in interface_masks.items():
        chain_pair_pae[(chain_i, chain_j)] = compute_mean_over_subsampled_pairs(
            pae, mask
        )[batch_idx].item()
        chain_pair_pae_min[(chain_i, chain_j)] = compute_min_over_subsampled_pairs(
            pae, mask
        )[batch_idx].item()
        chain_pair_pde[(chain_i, chain_j)] = compute_mean_over_subsampled_pairs(
            pde, mask
        )[batch_idx].item()
        chain_pair_pde_min[(chain_i, chain_j)] = compute_min_over_subsampled_pairs(
            pde, mask
        )[batch_idx].item()

    # Overall metrics for this batch
    overall_plddt = compute_mean_over_subsampled_pairs(
        plddt, is_real_atom[..., :NHEAVY]
    )[batch_idx].item()
    overall_pae = pae[batch_idx].mean().item()
    overall_pde = pde[batch_idx].mean().item()

    # Build chain_pair matrices (NxN); diagonal and missing pairs stay None
    chain_pair_pae_matrix = [[None] * n_chains for _ in range(n_chains)]
    chain_pair_pae_min_matrix = [[None] * n_chains for _ in range(n_chains)]
    chain_pair_pde_matrix = [[None] * n_chains for _ in range(n_chains)]
    chain_pair_pde_min_matrix = [[None] * n_chains for _ in range(n_chains)]
    for i, chain_i in enumerate(chains):
        for j, chain_j in enumerate(chains):
            if i != j and (chain_i, chain_j) in chain_pair_pae:
                chain_pair_pae_matrix[i][j] = round(
                    chain_pair_pae[(chain_i, chain_j)], 2
                )
                chain_pair_pae_min_matrix[i][j] = round(
                    chain_pair_pae_min[(chain_i, chain_j)], 2
                )
                chain_pair_pde_matrix[i][j] = round(
                    chain_pair_pde[(chain_i, chain_j)], 2
                )
                chain_pair_pde_min_matrix[i][j] = round(
                    chain_pair_pde_min[(chain_i, chain_j)], 2
                )

    # Extract per-atom pLDDT values (only real atoms, flattened)
    atom_plddts = plddt[batch_idx][is_real_atom[..., :NHEAVY]].cpu().tolist()

    # Extract atom/token chain and residue info from atom_array
    atom_chain_ids = atom_array.chain_id.tolist()
    token_chain_ids = list(chain_iid_token_lvl)
    token_res_ids = list(
        range(len(chain_iid_token_lvl))
    )  # Simplified; could map to actual res_id

    # PAE matrix for this batch
    pae_matrix = pae[batch_idx].cpu().tolist()

    # Build summary_confidences (AlphaFold3-style + RF3 extensions)
    summary_confidences = {
        # NOTE(review): "chain_ptm" is populated with chain-level pLDDT values,
        # not a true pTM — confirm downstream consumers expect this.
        "chain_ptm": [round(chain_plddt.get(c, 0.0), 2) for c in chains],
        "chain_pair_pae_min": chain_pair_pae_min_matrix,
        "chain_pair_pde_min": chain_pair_pde_min_matrix,
        "chain_pair_pae": chain_pair_pae_matrix,
        "chain_pair_pde": chain_pair_pde_matrix,
        "overall_plddt": round(overall_plddt, 4),
        "overall_pde": round(overall_pde, 4),
        "overall_pae": round(overall_pae, 4),
        # Note: ptm, iptm, has_clash should be populated from metrics_output
    }

    # Build full confidences (per-atom data)
    confidences = {
        "atom_chain_ids": atom_chain_ids,
        "atom_plddts": [round(p, 2) for p in atom_plddts],
        "pae": [[round(v, 2) for v in row] for row in pae_matrix],
        "token_chain_ids": token_chain_ids,
        "token_res_ids": token_res_ids,
    }

    return {
        "summary_confidences": summary_confidences,
        "confidences": confidences,
        "plddt": plddt,
        "pae": pae,
        "pde": pde,
    }
399
+
400
+
401
def compute_batch_indices_with_lowest_predicted_error(
    plddt: torch.Tensor,
    is_real_atom: torch.Tensor,
    pae: torch.Tensor,
    confidence_loss_cfg: dict | DictConfig,
    chain_iid_token_lvl: torch.Tensor,
    is_ligand: torch.Tensor,
    interfaces_to_score: list[tuple],
    pn_units_to_score: list[tuple],
    pde: torch.Tensor | None = None,
) -> dict[str, Any]:
    """Given the confidence logits, computes the index within the diffusion batch of the best predicted structure.

    Metrics include pAE, pLDDT, and pDE, among others.

    Args:
        plddt: pLDDT logits of shape [B, n_token, NHEAVY * n_bins] (reshaped and unbinned below).
        is_real_atom: Boolean mask of real atoms; only the first NHEAVY slots are used.
        pae: pAE logits with the bin dimension last.
        confidence_loss_cfg: Config with plddt/pae/pde sub-configs (max_value, n_bins).
        chain_iid_token_lvl: Per-token chain identifiers used to build pair masks.
        is_ligand: Per-token boolean tensor marking ligand tokens.
        interfaces_to_score: Pairs of PN-unit ids whose interfaces should be ranked.
        pn_units_to_score: PN-unit ids whose chains should be ranked.
        pde: Optional pDE logits. BUGFIX: previously the "pDE" ranking was silently
            computed from the *pAE* logits (there was no pde argument at all, yet the
            values were unbinned with the pde config). Pass the real pDE logits here
            for a correct pde_idx; when omitted, the old pae-derived behavior is kept
            for backward compatibility.

    Returns:
        dict[str, Any]: A dictionary containing the following keys:
            - pae_idx: The index within the diffusion batch of the structure with the best overall pAE (Predicted Aligned Error)
            - pde_idx: The index within the diffusion batch of the structure with the best overall pDE (Predicted Distance Error)
            - plddt_idx: The index within the diffusion batch of the structure with the best overall pLDDT (Predicted Local Distance
              Difference Test)
            - best_chain_to_all_idx: The index within the diffusion batch of the structure with the best pAE subsampled over any
              pair (i,j) where i == chain or j == chain
            - best_chain_to_self_idx: The index within the diffusion batch of the structure with the best pAE subsampled over any
              pair (i,j) where i == chain and j == chain
            - best_interface_idx: For each interface between two scored PN Units, the index within the diffusion batch of the
              structure with the best mean pAE for all (i,j) where i == interface_chain or j == interface_chain and i != j
            - best_lig_ipae_idx: The index within the diffusion batch for the best pAE subsampled over any pair (i,j)
              where i == chain or j == chain and i != j and i or j is a ligand
    """
    # TODO: Have this function take an `AtomArray` as input so we quickly build masks with much less code
    # TODO: Explore how we can write this function more concisely
    return_dict = {}

    # AF3's ranking metrics work like this, but using ptm instead of ipae:
    scored_chains, interfaces, interface_chains = _select_scored_units(
        interfaces_to_score, pn_units_to_score
    )

    chain_to_all_masks = _create_chain_to_all_masks(chain_iid_token_lvl, scored_chains)
    chain_to_self_masks = _create_chain_to_self_masks(
        chain_iid_token_lvl, scored_chains
    )
    interface_masks, lig_chains = _create_interface_masks(
        chain_iid_token_lvl, interfaces, is_ligand
    )

    # Masks are built on CPU; move every tensor leaf to the logits' device
    gpu = plddt.device
    chain_to_all_masks = tree.map_structure(
        lambda x: x.to(gpu) if hasattr(x, "cpu") else x, chain_to_all_masks
    )
    chain_to_self_masks = tree.map_structure(
        lambda x: x.to(gpu) if hasattr(x, "cpu") else x, chain_to_self_masks
    )
    interface_masks = tree.map_structure(
        lambda x: x.to(gpu) if hasattr(x, "cpu") else x, interface_masks
    )

    # Reshape logits to B, K, L, NHEAVY
    plddt = (
        plddt.reshape(
            -1,
            plddt.shape[1],
            NHEAVY,
            confidence_loss_cfg.plddt.n_bins,
        )
        .permute(0, 3, 1, 2)
        .float()
    )
    # Reshape the pae and pde logits to B, K, L, L
    pae_logits = pae.permute(0, 3, 1, 2).float()
    # BUGFIX: the pDE logits used to be derived from `pae` unconditionally; use the
    # dedicated `pde` tensor when the caller provides one.
    pde_logits = (pde if pde is not None else pae).permute(0, 3, 1, 2).float()

    pae_logits_unbinned = unbin_logits(
        pae_logits, confidence_loss_cfg.pae.max_value, confidence_loss_cfg.pae.n_bins
    )
    plddt_logits_unbinned = unbin_logits(
        plddt, confidence_loss_cfg.plddt.max_value, confidence_loss_cfg.plddt.n_bins
    )
    pde_logits_unbinned = unbin_logits(
        pde_logits, confidence_loss_cfg.pde.max_value, confidence_loss_cfg.pde.n_bins
    )

    # Whole-complex aggregates per batch element
    complex_pae = pae_logits_unbinned.mean(dim=(1, 2))
    complex_pde = pde_logits_unbinned.mean(dim=(1, 2))
    complex_plddt = (plddt_logits_unbinned * is_real_atom[..., :NHEAVY]).sum(
        dim=(1, 2)
    ) / is_real_atom[..., :NHEAVY].sum()

    # Lower is better for pAE/pDE; higher is better for pLDDT
    return_dict["pae_idx"] = torch.argmin(complex_pae)
    return_dict["pde_idx"] = torch.argmin(complex_pde)
    return_dict["plddt_idx"] = torch.argmax(complex_plddt)

    chain_to_self_paes = _get_masked_error_per_chain(
        scored_chains, chain_to_self_masks, pae_logits_unbinned
    )
    chain_to_all_paes = _get_masked_error_per_chain(
        scored_chains, chain_to_all_masks, pae_logits_unbinned
    )
    interface_chain_paes = _get_masked_error_per_chain(
        interface_chains, interface_masks, pae_logits_unbinned
    )
    # average over both interfaces
    average_interface_paes = _get_average_error_per_interface(
        interfaces, lig_chains, interface_chain_paes
    )

    return_dict["best_chain_to_all_idx"] = _get_lowest_error_indices(chain_to_all_paes)
    return_dict["best_chain_to_self_idx"] = _get_lowest_error_indices(
        chain_to_self_paes
    )
    return_dict["best_interface_idx"] = _get_lowest_error_indices(
        average_interface_paes
    )
    # for ligands, we don't average the error
    return_dict["best_lig_ipae_idx"] = _get_lowest_error_ligand_indices(
        interface_chain_paes, interfaces, lig_chains
    )
    return return_dict
520
+
521
+
522
def annotate_atom_array_b_factor_with_plddt(
    atom_array: AtomArray | AtomArrayStack,
    plddt: torch.Tensor,
    is_real_atom: torch.Tensor,
) -> List[AtomArray]:
    """Write per-atom pLDDT values into the b_factor annotation of a structure.

    Args:
        atom_array: The AtomArray or AtomArrayStack to annotate
        plddt: The pLDDT tensor of shape (B, I, NHEAVY)
        is_real_atom: A mask indicating which atoms are in the structure of shape (I, NHEAVY)

    Returns:
        list[AtomArray]: The annotated list of AtomArrays. A list is returned because
        biotite's AtomArrayStack cannot hold per-model annotations (only coordinates
        vary across models), so each model gets its own AtomArray.
    """
    # Select only real atoms, keeping the diffusion-batch dimension: (B, n_real_atoms)
    per_atom_plddt = plddt[:, is_real_atom[..., :NHEAVY]]
    assert per_atom_plddt.shape[1] == atom_array.array_length()

    annotated: list[AtomArray] = []
    if isinstance(atom_array, AtomArrayStack):
        # One AtomArray per model, each with its own b_factor column
        for model_idx, model in enumerate(atom_array):
            model.set_annotation("b_factor", per_atom_plddt[model_idx].cpu().numpy())
            annotated.append(model)
    else:
        # A single AtomArray implies a single batch element
        assert per_atom_plddt.shape[0] == 1
        atom_array.set_annotation("b_factor", per_atom_plddt[0].cpu().numpy())
        annotated.append(atom_array)

    # Sanity check: no NaNs may leak into the written b_factors
    for model in annotated:
        assert np.isnan(model.b_factor).sum() == 0

    return annotated
557
+
558
+
559
+ def _select_scored_units(
560
+ interfaces_to_score: list[tuple], pn_units_to_score: list[tuple]
561
+ ):
562
+ scored_chains = []
563
+ interfaces = []
564
+ interface_chains = []
565
+ for k in interfaces_to_score:
566
+ interfaces.append(f"{k[0]}-{k[1]}")
567
+ interface_chains.append(k[0])
568
+ interface_chains.append(k[1])
569
+ for k in pn_units_to_score:
570
+ scored_chains.append(k[0])
571
+
572
+ return scored_chains, interfaces, interface_chains
573
+
574
+
575
+ def _create_chain_to_all_masks(ch_label, chains_to_score):
576
+ unique_chains = np.unique(ch_label)
577
+ I = len(ch_label)
578
+ chain_to_all_masks = {}
579
+ for chain in unique_chains:
580
+ if chain in chains_to_score:
581
+ indices = torch.from_numpy((ch_label == chain))
582
+ mask = indices.unsqueeze(0) | indices.unsqueeze(1)
583
+ # set the diagonal to false
584
+ mask = mask & ~torch.eye(I, device=mask.device, dtype=torch.bool)
585
+ chain_to_all_masks[chain] = mask
586
+ return chain_to_all_masks
587
+
588
+
589
+ def _create_chain_to_self_masks(ch_label, chains_to_score):
590
+ unique_chains = np.unique(ch_label)
591
+ I = len(ch_label)
592
+ chain_to_self_masks = {}
593
+ for chain in unique_chains:
594
+ if chain in chains_to_score:
595
+ indices = torch.from_numpy((ch_label == chain))
596
+ mask = indices.unsqueeze(0) & indices.unsqueeze(1)
597
+ # set the diagonal to false
598
+ mask = mask & ~torch.eye(I, device=mask.device, dtype=torch.bool)
599
+ chain_to_self_masks[chain] = mask
600
+ return chain_to_self_masks
601
+
602
+
603
+ def _create_interface_masks(ch_label, interfaces, is_ligand):
604
+ interface_masks = {}
605
+ interface_chains = []
606
+ ligand_chains = []
607
+ for interface in interfaces:
608
+ interface_chains.append(interface.split("-")[0])
609
+ interface_chains.append(interface.split("-")[1])
610
+ interface_chains = set(interface_chains)
611
+ for chain in interface_chains:
612
+ chain_indices = torch.from_numpy((ch_label == chain))
613
+
614
+ to_self = chain_indices.unsqueeze(0) & chain_indices.unsqueeze(1)
615
+ to_all = chain_indices.unsqueeze(0) | chain_indices.unsqueeze(1)
616
+ interface_mask = to_all & ~to_self
617
+ interface_masks[chain] = interface_mask
618
+
619
+ if torch.all(is_ligand[chain_indices]):
620
+ ligand_chains.append(chain)
621
+
622
+ return interface_masks, ligand_chains
623
+
624
+
625
def _get_masked_error_per_chain(chains, masks, unbinned_logits):
    """Mean predicted error per chain, restricted to each chain's pair mask."""
    return {
        chain: compute_mean_over_subsampled_pairs(unbinned_logits, masks[chain])
        for chain in chains
    }
633
+
634
+
635
+ def _get_average_error_per_interface(interfaces, lig_chains, interface_errors):
636
+ average_error = {}
637
+ for interface in interfaces:
638
+ chain_a = interface.split("-")[0]
639
+ chain_b = interface.split("-")[1]
640
+ average_error[interface] = (
641
+ interface_errors[chain_a] + interface_errors[chain_b]
642
+ ) / 2
643
+
644
+ return average_error
645
+
646
+
647
+ def _get_lowest_error_indices(errors):
648
+ lowest_error_indices = {}
649
+ for k, v in errors.items():
650
+ lowest_error_indices[k] = torch.argmin(v)
651
+
652
+ return lowest_error_indices
653
+
654
+
655
+ def _get_lowest_error_ligand_indices(errors, interfaces, lig_chains):
656
+ # ligands are a special case in AF3, where they only consider the ligand chain's error and not the average for the interface
657
+ lowest_error_indices = {}
658
+ for interface in interfaces:
659
+ chain_a = interface.split("-")[0]
660
+ chain_b = interface.split("-")[1]
661
+ if chain_a in lig_chains or chain_b in lig_chains:
662
+ if chain_a in lig_chains:
663
+ lig_chain = chain_a
664
+ elif chain_b in lig_chains:
665
+ lig_chain = chain_b
666
+
667
+ lowest_error_indices[interface] = torch.argmin(errors[lig_chain])
668
+ else:
669
+ # assign a random value to avoid key errors downstream; sorting ligand interfaces
670
+ # from other types is handles in analysis
671
+ lowest_error_indices[interface] = 0
672
+
673
+ return lowest_error_indices