rc-foundry 0.1.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (180)
  1. foundry/__init__.py +57 -0
  2. foundry/callbacks/__init__.py +5 -0
  3. foundry/callbacks/callback.py +116 -0
  4. foundry/callbacks/health_logging.py +419 -0
  5. foundry/callbacks/metrics_logging.py +211 -0
  6. foundry/callbacks/timing_logging.py +67 -0
  7. foundry/callbacks/train_logging.py +278 -0
  8. foundry/common.py +108 -0
  9. foundry/constants.py +28 -0
  10. foundry/hydra/resolvers.py +77 -0
  11. foundry/inference_engines/base.py +235 -0
  12. foundry/inference_engines/checkpoint_registry.py +66 -0
  13. foundry/metrics/__init__.py +12 -0
  14. foundry/metrics/losses.py +30 -0
  15. foundry/metrics/metric.py +319 -0
  16. foundry/model/layers/blocks.py +47 -0
  17. foundry/testing/__init__.py +6 -0
  18. foundry/testing/fixtures.py +19 -0
  19. foundry/testing/pytest_hooks.py +15 -0
  20. foundry/trainers/fabric.py +923 -0
  21. foundry/training/EMA.py +67 -0
  22. foundry/training/checkpoint.py +61 -0
  23. foundry/training/schedulers.py +91 -0
  24. foundry/utils/alignment.py +86 -0
  25. foundry/utils/components.py +415 -0
  26. foundry/utils/datasets.py +405 -0
  27. foundry/utils/ddp.py +103 -0
  28. foundry/utils/instantiators.py +72 -0
  29. foundry/utils/logging.py +279 -0
  30. foundry/utils/rigid.py +1460 -0
  31. foundry/utils/rotation_augmentation.py +65 -0
  32. foundry/utils/squashfs.py +172 -0
  33. foundry/utils/torch.py +317 -0
  34. foundry/utils/weights.py +271 -0
  35. foundry/version.py +34 -0
  36. foundry_cli/__init__.py +3 -0
  37. foundry_cli/download_checkpoints.py +281 -0
  38. mpnn/__init__.py +1 -0
  39. mpnn/collate/feature_collator.py +265 -0
  40. mpnn/inference.py +53 -0
  41. mpnn/inference_engines/mpnn.py +549 -0
  42. mpnn/loss/nll_loss.py +122 -0
  43. mpnn/metrics/nll.py +369 -0
  44. mpnn/metrics/sequence_recovery.py +440 -0
  45. mpnn/model/layers/graph_embeddings.py +2372 -0
  46. mpnn/model/layers/message_passing.py +332 -0
  47. mpnn/model/layers/position_wise_feed_forward.py +44 -0
  48. mpnn/model/layers/positional_encoding.py +98 -0
  49. mpnn/model/mpnn.py +2632 -0
  50. mpnn/pipelines/mpnn.py +162 -0
  51. mpnn/samplers/samplers.py +167 -0
  52. mpnn/train.py +341 -0
  53. mpnn/trainers/mpnn.py +193 -0
  54. mpnn/transforms/feature_aggregation/mpnn.py +184 -0
  55. mpnn/transforms/feature_aggregation/polymer_ligand_interface.py +76 -0
  56. mpnn/transforms/feature_aggregation/token_encodings.py +132 -0
  57. mpnn/transforms/feature_aggregation/user_settings.py +347 -0
  58. mpnn/transforms/polymer_ligand_interface.py +164 -0
  59. mpnn/utils/inference.py +2397 -0
  60. mpnn/utils/probability.py +37 -0
  61. mpnn/utils/weights.py +309 -0
  62. rc_foundry-0.1.1.dist-info/METADATA +239 -0
  63. rc_foundry-0.1.1.dist-info/RECORD +180 -0
  64. rc_foundry-0.1.1.dist-info/WHEEL +4 -0
  65. rc_foundry-0.1.1.dist-info/entry_points.txt +5 -0
  66. rc_foundry-0.1.1.dist-info/licenses/LICENSE.md +28 -0
  67. rf3/__init__.py +3 -0
  68. rf3/_version.py +33 -0
  69. rf3/alignment.py +79 -0
  70. rf3/callbacks/dump_validation_structures.py +101 -0
  71. rf3/callbacks/metrics_logging.py +324 -0
  72. rf3/chemical.py +1529 -0
  73. rf3/cli.py +77 -0
  74. rf3/data/cyclic_transform.py +78 -0
  75. rf3/data/extra_xforms.py +36 -0
  76. rf3/data/ground_truth_template.py +463 -0
  77. rf3/data/paired_msa.py +206 -0
  78. rf3/data/pipeline_utils.py +128 -0
  79. rf3/data/pipelines.py +558 -0
  80. rf3/diffusion_samplers/inference_sampler.py +222 -0
  81. rf3/inference.py +65 -0
  82. rf3/inference_engines/__init__.py +5 -0
  83. rf3/inference_engines/rf3.py +735 -0
  84. rf3/kinematics.py +354 -0
  85. rf3/loss/af3_confidence_loss.py +515 -0
  86. rf3/loss/af3_losses.py +655 -0
  87. rf3/loss/loss.py +179 -0
  88. rf3/metrics/chiral.py +179 -0
  89. rf3/metrics/clashing_chains.py +68 -0
  90. rf3/metrics/distogram.py +421 -0
  91. rf3/metrics/lddt.py +523 -0
  92. rf3/metrics/metadata.py +43 -0
  93. rf3/metrics/metric_utils.py +192 -0
  94. rf3/metrics/predicted_error.py +134 -0
  95. rf3/metrics/rasa.py +108 -0
  96. rf3/metrics/selected_distances.py +91 -0
  97. rf3/model/RF3.py +527 -0
  98. rf3/model/RF3_blocks.py +92 -0
  99. rf3/model/RF3_structure.py +303 -0
  100. rf3/model/layers/af3_auxiliary_heads.py +255 -0
  101. rf3/model/layers/af3_diffusion_transformer.py +544 -0
  102. rf3/model/layers/attention.py +313 -0
  103. rf3/model/layers/layer_utils.py +127 -0
  104. rf3/model/layers/mlff.py +118 -0
  105. rf3/model/layers/outer_product.py +59 -0
  106. rf3/model/layers/pairformer_layers.py +783 -0
  107. rf3/model/layers/structure_bias.py +56 -0
  108. rf3/scoring.py +1787 -0
  109. rf3/symmetry/resolve.py +284 -0
  110. rf3/train.py +194 -0
  111. rf3/trainers/rf3.py +570 -0
  112. rf3/util_module.py +47 -0
  113. rf3/utils/frames.py +109 -0
  114. rf3/utils/inference.py +665 -0
  115. rf3/utils/io.py +198 -0
  116. rf3/utils/loss.py +72 -0
  117. rf3/utils/predict_and_score.py +165 -0
  118. rf3/utils/predicted_error.py +673 -0
  119. rf3/utils/recycling.py +42 -0
  120. rf3/validate.py +140 -0
  121. rfd3/.gitignore +7 -0
  122. rfd3/Makefile +76 -0
  123. rfd3/__init__.py +12 -0
  124. rfd3/callbacks.py +66 -0
  125. rfd3/cli.py +41 -0
  126. rfd3/constants.py +212 -0
  127. rfd3/engine.py +543 -0
  128. rfd3/inference/datasets.py +193 -0
  129. rfd3/inference/input_parsing.py +1123 -0
  130. rfd3/inference/legacy_input_parsing.py +717 -0
  131. rfd3/inference/parsing.py +165 -0
  132. rfd3/inference/symmetry/atom_array.py +298 -0
  133. rfd3/inference/symmetry/checks.py +241 -0
  134. rfd3/inference/symmetry/contigs.py +63 -0
  135. rfd3/inference/symmetry/frames.py +355 -0
  136. rfd3/inference/symmetry/symmetry_utils.py +398 -0
  137. rfd3/metrics/design_metrics.py +465 -0
  138. rfd3/metrics/hbonds_hbplus_metrics.py +308 -0
  139. rfd3/metrics/hbonds_metrics.py +389 -0
  140. rfd3/metrics/losses.py +325 -0
  141. rfd3/metrics/metrics_utils.py +118 -0
  142. rfd3/metrics/sidechain_metrics.py +349 -0
  143. rfd3/model/RFD3.py +105 -0
  144. rfd3/model/RFD3_diffusion_module.py +387 -0
  145. rfd3/model/cfg_utils.py +81 -0
  146. rfd3/model/inference_sampler.py +635 -0
  147. rfd3/model/layers/attention.py +577 -0
  148. rfd3/model/layers/block_utils.py +580 -0
  149. rfd3/model/layers/blocks.py +777 -0
  150. rfd3/model/layers/chunked_pairwise.py +377 -0
  151. rfd3/model/layers/encoders.py +417 -0
  152. rfd3/model/layers/layer_utils.py +197 -0
  153. rfd3/model/layers/pairformer_layers.py +128 -0
  154. rfd3/run_inference.py +45 -0
  155. rfd3/testing/debug.py +139 -0
  156. rfd3/testing/debug_utils.py +73 -0
  157. rfd3/testing/testing_utils.py +356 -0
  158. rfd3/train.py +194 -0
  159. rfd3/trainer/dump_validation_structures.py +154 -0
  160. rfd3/trainer/fabric_trainer.py +923 -0
  161. rfd3/trainer/recycling.py +42 -0
  162. rfd3/trainer/rfd3.py +485 -0
  163. rfd3/trainer/trainer_utils.py +502 -0
  164. rfd3/transforms/conditioning_base.py +508 -0
  165. rfd3/transforms/conditioning_utils.py +200 -0
  166. rfd3/transforms/design_transforms.py +807 -0
  167. rfd3/transforms/dna_crop.py +523 -0
  168. rfd3/transforms/hbonds.py +407 -0
  169. rfd3/transforms/hbonds_hbplus.py +246 -0
  170. rfd3/transforms/ncaa_transforms.py +153 -0
  171. rfd3/transforms/pipelines.py +632 -0
  172. rfd3/transforms/ppi_transforms.py +541 -0
  173. rfd3/transforms/rasa.py +116 -0
  174. rfd3/transforms/symmetry.py +76 -0
  175. rfd3/transforms/training_conditions.py +552 -0
  176. rfd3/transforms/util_transforms.py +498 -0
  177. rfd3/transforms/virtual_atoms.py +305 -0
  178. rfd3/utils/inference.py +648 -0
  179. rfd3/utils/io.py +245 -0
  180. rfd3/utils/vizualize.py +276 -0
mpnn/utils/probability.py ADDED
@@ -0,0 +1,37 @@
+ import numpy as np
+
+
+ def sample_bernoulli_rv(p):
+     """
+     Given a probability p, representing the success probability of a Bernoulli
+     distribution, sample X ~ Bernoulli(p).
+
+     Arguments:
+         p (float): a float between 0 and 1, representing the success probability
+             of a Bernoulli distribution.
+
+     Returns:
+         x (int): the result of sampling the random variable X ~ Bernoulli(p).
+             P(X = 1) = p
+             P(X = 0) = 1 - p.
+     """
+     # Check that 0 <= p <= 1.
+     if p < 0 or p > 1:
+         raise ValueError("The success probability p must be between 0 and 1 inclusive.")
+
+     # Handle the edge cases; otherwise, use the numpy uniform distribution.
+     if p == 0:
+         x = 0
+     elif p == 1:
+         x = 1
+     else:
+         # Sample Y ~ Uniform(0, 1).
+         uniform_sample = np.random.uniform(0.0, 1.0)
+
+         # P(Y < p) = p.
+         if uniform_sample < p:
+             x = 1
+         else:
+             x = 0
+
+     return x
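The sampler is easy to sanity-check. A minimal usage sketch (not part of the package), assuming the file above is `mpnn/utils/probability.py` as the "Files changed" list suggests:

```python
import numpy as np

# Hypothetical import path, inferred from the file list above.
from mpnn.utils.probability import sample_bernoulli_rv

# By the law of large numbers, the mean of many Bernoulli(p) draws should
# approach p.
p = 0.3
samples = [sample_bernoulli_rv(p) for _ in range(10_000)]
print(np.mean(samples))  # ~0.3
```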
mpnn/utils/weights.py ADDED
@@ -0,0 +1,309 @@
+ import torch
+ from mpnn.transforms.feature_aggregation.token_encodings import (
+     legacy_token_order,
+     token_order,
+ )
+
+
+ def load_legacy_weights(model: torch.nn.Module, weights_path: str) -> None:
+     """
+     Load a legacy MPNN checkpoint from 'weights_path' into 'model' (the
+     refactored MPNN implementation).
+
+     This performs several transformations:
+     - Copies certain non-learned registries (e.g., periodic table info) from
+       the new model into the checkpoint state dict (to match the new code).
+     - Renames legacy parameter/buffer names into the new module naming scheme.
+     - Fixes a 120->119 atom-type embedding weight size mismatch by dropping
+       the unused legacy atom type.
+     - Reorders pairwise backbone distance embedding weights to match the new
+       atom-pair ordering.
+     - Reorders token (AA) embedding/projection weights from the legacy order
+       (alphabetical 1-letter) to the new order (alphabetical 3-letter).
+     """
+     # Load legacy checkpoint state dict.
+     checkpoint = torch.load(weights_path, map_location="cpu", weights_only=False)
+     checkpoint_state_dict = checkpoint["model_state_dict"]
+
+     # Values to copy directly from the *current* model into the state dict.
+     # These are effectively "configuration" tensors/registries, not learned
+     # weights we want to preserve from the legacy model.
+     values_to_copy = [
+         "graph_featurization_module.side_chain_atom_types",
+         "graph_featurization_module.periodic_table_groups",
+         "graph_featurization_module.periodic_table_periods",
+     ]
+     # Copy over some hard-coded registers/values.
+     for value_name in values_to_copy:
+         # Walk the attribute chain.
+         attr_list = value_name.split(".")
+         sub_module = model
+         while len(attr_list) > 1 and sub_module is not None:
+             attr = attr_list.pop(0)
+             if hasattr(sub_module, attr):
+                 sub_module = getattr(sub_module, attr)
+             else:
+                 sub_module = None
+
+         # If the current sub-module exists, and it has the final attribute,
+         # copy it into the checkpoint state dict.
+         if sub_module is not None:
+             if hasattr(sub_module, attr_list[0]):
+                 checkpoint_state_dict[value_name] = getattr(sub_module, attr_list[0])
+
+     # Mapping of legacy weight names to new weight names.
+     # Left side = name in the old checkpoint.
+     # Right side = name expected by the new model implementation.
+     legacy_weight_to_new_weight = {
+         "features.embeddings.linear.weight": "graph_featurization_module.positional_embedding.embed_positional_features.weight",
+         "features.embeddings.linear.bias": "graph_featurization_module.positional_embedding.embed_positional_features.bias",
+         "features.edge_embedding.weight": "graph_featurization_module.edge_embedding.weight",
+         "features.norm_edges.weight": "graph_featurization_module.edge_norm.weight",
+         "features.norm_edges.bias": "graph_featurization_module.edge_norm.bias",
+         "context_encoder_layers.0.norm1.weight": "protein_ligand_context_encoder_layers.0.norm1.weight",
+         "context_encoder_layers.0.norm1.bias": "protein_ligand_context_encoder_layers.0.norm1.bias",
+         "context_encoder_layers.0.norm2.weight": "protein_ligand_context_encoder_layers.0.norm2.weight",
+         "context_encoder_layers.0.norm2.bias": "protein_ligand_context_encoder_layers.0.norm2.bias",
+         "context_encoder_layers.0.W1.weight": "protein_ligand_context_encoder_layers.0.W1.weight",
+         "context_encoder_layers.0.W1.bias": "protein_ligand_context_encoder_layers.0.W1.bias",
+         "context_encoder_layers.0.W2.weight": "protein_ligand_context_encoder_layers.0.W2.weight",
+         "context_encoder_layers.0.W2.bias": "protein_ligand_context_encoder_layers.0.W2.bias",
+         "context_encoder_layers.0.W3.weight": "protein_ligand_context_encoder_layers.0.W3.weight",
+         "context_encoder_layers.0.W3.bias": "protein_ligand_context_encoder_layers.0.W3.bias",
+         "context_encoder_layers.0.dense.W_in.weight": "protein_ligand_context_encoder_layers.0.dense.W_in.weight",
+         "context_encoder_layers.0.dense.W_in.bias": "protein_ligand_context_encoder_layers.0.dense.W_in.bias",
+         "context_encoder_layers.0.dense.W_out.weight": "protein_ligand_context_encoder_layers.0.dense.W_out.weight",
+         "context_encoder_layers.0.dense.W_out.bias": "protein_ligand_context_encoder_layers.0.dense.W_out.bias",
+         "context_encoder_layers.1.norm1.weight": "protein_ligand_context_encoder_layers.1.norm1.weight",
+         "context_encoder_layers.1.norm1.bias": "protein_ligand_context_encoder_layers.1.norm1.bias",
+         "context_encoder_layers.1.norm2.weight": "protein_ligand_context_encoder_layers.1.norm2.weight",
+         "context_encoder_layers.1.norm2.bias": "protein_ligand_context_encoder_layers.1.norm2.bias",
+         "context_encoder_layers.1.W1.weight": "protein_ligand_context_encoder_layers.1.W1.weight",
+         "context_encoder_layers.1.W1.bias": "protein_ligand_context_encoder_layers.1.W1.bias",
+         "context_encoder_layers.1.W2.weight": "protein_ligand_context_encoder_layers.1.W2.weight",
+         "context_encoder_layers.1.W2.bias": "protein_ligand_context_encoder_layers.1.W2.bias",
+         "context_encoder_layers.1.W3.weight": "protein_ligand_context_encoder_layers.1.W3.weight",
+         "context_encoder_layers.1.W3.bias": "protein_ligand_context_encoder_layers.1.W3.bias",
+         "context_encoder_layers.1.dense.W_in.weight": "protein_ligand_context_encoder_layers.1.dense.W_in.weight",
+         "context_encoder_layers.1.dense.W_in.bias": "protein_ligand_context_encoder_layers.1.dense.W_in.bias",
+         "context_encoder_layers.1.dense.W_out.weight": "protein_ligand_context_encoder_layers.1.dense.W_out.weight",
+         "context_encoder_layers.1.dense.W_out.bias": "protein_ligand_context_encoder_layers.1.dense.W_out.bias",
+         "y_context_encoder_layers.0.norm1.weight": "ligand_context_encoder_layers.0.norm1.weight",
+         "y_context_encoder_layers.0.norm1.bias": "ligand_context_encoder_layers.0.norm1.bias",
+         "y_context_encoder_layers.0.norm2.weight": "ligand_context_encoder_layers.0.norm2.weight",
+         "y_context_encoder_layers.0.norm2.bias": "ligand_context_encoder_layers.0.norm2.bias",
+         "y_context_encoder_layers.0.W1.weight": "ligand_context_encoder_layers.0.W1.weight",
+         "y_context_encoder_layers.0.W1.bias": "ligand_context_encoder_layers.0.W1.bias",
+         "y_context_encoder_layers.0.W2.weight": "ligand_context_encoder_layers.0.W2.weight",
+         "y_context_encoder_layers.0.W2.bias": "ligand_context_encoder_layers.0.W2.bias",
+         "y_context_encoder_layers.0.W3.weight": "ligand_context_encoder_layers.0.W3.weight",
+         "y_context_encoder_layers.0.W3.bias": "ligand_context_encoder_layers.0.W3.bias",
+         "y_context_encoder_layers.0.dense.W_in.weight": "ligand_context_encoder_layers.0.dense.W_in.weight",
+         "y_context_encoder_layers.0.dense.W_in.bias": "ligand_context_encoder_layers.0.dense.W_in.bias",
+         "y_context_encoder_layers.0.dense.W_out.weight": "ligand_context_encoder_layers.0.dense.W_out.weight",
+         "y_context_encoder_layers.0.dense.W_out.bias": "ligand_context_encoder_layers.0.dense.W_out.bias",
+         "y_context_encoder_layers.1.norm1.weight": "ligand_context_encoder_layers.1.norm1.weight",
+         "y_context_encoder_layers.1.norm1.bias": "ligand_context_encoder_layers.1.norm1.bias",
+         "y_context_encoder_layers.1.norm2.weight": "ligand_context_encoder_layers.1.norm2.weight",
+         "y_context_encoder_layers.1.norm2.bias": "ligand_context_encoder_layers.1.norm2.bias",
+         "y_context_encoder_layers.1.W1.weight": "ligand_context_encoder_layers.1.W1.weight",
+         "y_context_encoder_layers.1.W1.bias": "ligand_context_encoder_layers.1.W1.bias",
+         "y_context_encoder_layers.1.W2.weight": "ligand_context_encoder_layers.1.W2.weight",
+         "y_context_encoder_layers.1.W2.bias": "ligand_context_encoder_layers.1.W2.bias",
+         "y_context_encoder_layers.1.W3.weight": "ligand_context_encoder_layers.1.W3.weight",
+         "y_context_encoder_layers.1.W3.bias": "ligand_context_encoder_layers.1.W3.bias",
+         "y_context_encoder_layers.1.dense.W_in.weight": "ligand_context_encoder_layers.1.dense.W_in.weight",
+         "y_context_encoder_layers.1.dense.W_in.bias": "ligand_context_encoder_layers.1.dense.W_in.bias",
+         "y_context_encoder_layers.1.dense.W_out.weight": "ligand_context_encoder_layers.1.dense.W_out.weight",
+         "y_context_encoder_layers.1.dense.W_out.bias": "ligand_context_encoder_layers.1.dense.W_out.bias",
+         "features.node_project_down.weight": "graph_featurization_module.node_embedding.weight",
+         "features.node_project_down.bias": "graph_featurization_module.node_embedding.bias",
+         "features.norm_nodes.weight": "graph_featurization_module.node_norm.weight",
+         "features.norm_nodes.bias": "graph_featurization_module.node_norm.bias",
+         "features.type_linear.weight": "graph_featurization_module.embed_atom_type_features.weight",
+         "features.type_linear.bias": "graph_featurization_module.embed_atom_type_features.bias",
+         "features.y_nodes.weight": "graph_featurization_module.ligand_subgraph_node_embedding.weight",
+         "features.y_edges.weight": "graph_featurization_module.ligand_subgraph_edge_embedding.weight",
+         "features.norm_y_edges.weight": "graph_featurization_module.ligand_subgraph_edge_norm.weight",
+         "features.norm_y_edges.bias": "graph_featurization_module.ligand_subgraph_edge_norm.bias",
+         "features.norm_y_nodes.weight": "graph_featurization_module.ligand_subgraph_node_norm.weight",
+         "features.norm_y_nodes.bias": "graph_featurization_module.ligand_subgraph_node_norm.bias",
+         "W_v.weight": "W_protein_to_ligand_edges_embed.weight",
+         "W_v.bias": "W_protein_to_ligand_edges_embed.bias",
+         "W_c.weight": "W_protein_encoding_embed.weight",
+         "W_c.bias": "W_protein_encoding_embed.bias",
+         "W_nodes_y.weight": "W_ligand_nodes_embed.weight",
+         "W_nodes_y.bias": "W_ligand_nodes_embed.bias",
+         "W_edges_y.weight": "W_ligand_edges_embed.weight",
+         "W_edges_y.bias": "W_ligand_edges_embed.bias",
+         "V_C.weight": "W_final_context_embed.weight",
+         "V_C_norm.weight": "final_context_norm.weight",
+         "V_C_norm.bias": "final_context_norm.bias",
+     }
+     # Rename the weights in the checkpoint state dict.
+     for legacy_weight_name, new_weight_name in legacy_weight_to_new_weight.items():
+         if legacy_weight_name in checkpoint_state_dict:
+             checkpoint_state_dict[new_weight_name] = checkpoint_state_dict.pop(
+                 legacy_weight_name
+             )
+
+     # Remove unused atom type embedding weight.
+     # - Previous LigandMPNN used 120 atom types, but the last one was unused.
+     # - The new model uses 119 atom types.
+     atom_type_embedding_keys = [
+         "graph_featurization_module.embed_atom_type_features.weight",
+         "graph_featurization_module.ligand_subgraph_node_embedding.weight",
+     ]
+     # For each of these keys, drop the unused atom type embedding.
+     for key in atom_type_embedding_keys:
+         if key in checkpoint_state_dict:
+             legacy_weight = checkpoint_state_dict[key]
+             num_atomic_numbers = model.graph_featurization_module.num_atomic_numbers
+             checkpoint_state_dict[key] = torch.cat(
+                 [
+                     legacy_weight[:, :num_atomic_numbers],
+                     legacy_weight[:, num_atomic_numbers + 1 :],
+                 ],
+                 dim=1,
+             )
+
+     # Permute weights for embedding of pairwise backbone atom distances.
+     # - The legacy model used the order specified in 'legacy_order' dict.
+     # - The new model uses the order specified in 'new_order' list (the
+     #   outer product of the atom types in the order N, Ca, C, O, Cb).
+     legacy_order = {
+         "Ca-Ca": 0,
+         "N-N": 1,
+         "C-C": 2,
+         "O-O": 3,
+         "Cb-Cb": 4,
+         "Ca-N": 5,
+         "Ca-C": 6,
+         "Ca-O": 7,
+         "Ca-Cb": 8,
+         "N-C": 9,
+         "N-O": 10,
+         "N-Cb": 11,
+         "Cb-C": 12,
+         "Cb-O": 13,
+         "O-C": 14,
+         "N-Ca": 15,
+         "C-Ca": 16,
+         "O-Ca": 17,
+         "Cb-Ca": 18,
+         "C-N": 19,
+         "O-N": 20,
+         "Cb-N": 21,
+         "C-Cb": 22,
+         "O-Cb": 23,
+         "C-O": 24,
+     }
+     new_order = [
+         "N-N",
+         "N-Ca",
+         "N-C",
+         "N-O",
+         "N-Cb",
+         "Ca-N",
+         "Ca-Ca",
+         "Ca-C",
+         "Ca-O",
+         "Ca-Cb",
+         "C-N",
+         "C-Ca",
+         "C-C",
+         "C-O",
+         "C-Cb",
+         "O-N",
+         "O-Ca",
+         "O-C",
+         "O-O",
+         "O-Cb",
+         "Cb-N",
+         "Cb-Ca",
+         "Cb-C",
+         "Cb-O",
+         "Cb-Cb",
+     ]
+     pairwise_backbone_atom_embeddings_keys = [
+         "graph_featurization_module.edge_embedding.weight",
+     ]
+     for key in pairwise_backbone_atom_embeddings_keys:
+         if key in checkpoint_state_dict:
+             # Grab the legacy weight and shape.
+             legacy_weight = checkpoint_state_dict[key]
+             out_dim, _ = legacy_weight.shape
+
+             # Grab the necessary dimensions from the model.
+             num_positional_embeddings = (
+                 model.graph_featurization_module.num_positional_embeddings
+             )
+             num_atoms = (
+                 model.graph_featurization_module.num_backbone_atoms
+                 + model.graph_featurization_module.num_virtual_atoms
+             )
+             num_rbf = model.graph_featurization_module.num_rbf
+
+             # Split positional and RBF embedding weights.
+             legacy_weight_positional_embeddings = legacy_weight[
+                 :, :num_positional_embeddings
+             ]
+             legacy_weight_rbf_embeddings_flat = legacy_weight[
+                 :, num_positional_embeddings:
+             ]
+
+             # Reshape the weights to separate atom pairs and the rbf dimension.
+             legacy_weight_rbf_embeddings_atom_pairs = (
+                 legacy_weight_rbf_embeddings_flat.view(
+                     out_dim, num_atoms * num_atoms, num_rbf
+                 )
+             )
+
+             # Reorder the atom pairs to match the new order.
+             new_weight_rbf_embeddings_atom_pairs = (
+                 legacy_weight_rbf_embeddings_atom_pairs[
+                     :, [legacy_order[atom_pair_name] for atom_pair_name in new_order], :
+                 ]
+             )
+
+             # Flatten the reordered weights back to 2D.
+             new_weight_rbf_embeddings_flat = (
+                 new_weight_rbf_embeddings_atom_pairs.reshape(
+                     out_dim, num_atoms * num_atoms * num_rbf
+                 )
+             )
+
+             # Concatenate positional + reordered RBF
+             checkpoint_state_dict[key] = torch.cat(
+                 [legacy_weight_positional_embeddings, new_weight_rbf_embeddings_flat],
+                 dim=1,
+             )
+
+     # Permute the token order of amino acids coming out of the model to match
+     # the new vocabulary order.
+     # - The legacy model used an order specified by alphabetic order of one-
+     #   letter amino acid codes.
+     # - The new model uses an order specified by alphabetic order of three-
+     #   letter amino acid codes.
+     token_embedding_keys = ["W_s.weight"]
+     token_projection_keys = ["W_out.weight", "W_out.bias"]
+     # For each of these keys, reorder the embeddings/projections.
+     for key in token_embedding_keys + token_projection_keys:
+         if key in checkpoint_state_dict:
+             # Grab the old weight.
+             legacy_weight = checkpoint_state_dict[key]
+
+             # Reorder the weight/bias according to the new token order.
+             if "weight" in key:
+                 checkpoint_state_dict[key] = legacy_weight[
+                     [legacy_token_order.index(aa) for aa in token_order], :
+                 ]
+             elif "bias" in key:
+                 checkpoint_state_dict[key] = legacy_weight[
+                     [legacy_token_order.index(aa) for aa in token_order]
+                 ]
+             else:
+                 raise ValueError(f"Unrecognized key for token projection: {key}")
+
+     # Load the modified state dict into the model.
+     model.load_state_dict(checkpoint_state_dict, strict=True)
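The two reordering tricks above (a row permutation for the token embeddings, and a view/index/reshape round trip for the atom-pair RBF blocks) are easiest to see on toy tensors. A minimal sketch, not the package's API, where `legacy_aa` and `new_aa` are hypothetical stand-ins for the imported `legacy_token_order` and `token_order`:

```python
import torch

# 1) Token reorder: build an index mapping each token in the new vocabulary
#    order back to its row in the legacy embedding matrix. Assumed orders:
#    alphabetical by one-letter code (legacy) vs. alphabetical by three-letter
#    code (new), written here with one-letter equivalents.
legacy_aa = list("ACDEFGHIKLMNPQRSTVWY")  # A, C, D, E, ...
new_aa = list("ARNDCQEGHILKMFPSTWYV")     # ALA, ARG, ASN, ASP, CYS, ...

legacy_embedding = torch.randn(20, 8)  # toy [vocab, hidden] weight
perm = [legacy_aa.index(aa) for aa in new_aa]
new_embedding = legacy_embedding[perm, :]
assert new_embedding[1].equal(legacy_embedding[legacy_aa.index("R")])  # ARG row

# 2) Atom-pair reorder: expose the (pair, rbf) structure of a flat weight,
#    permute along the pair axis, then flatten back, as done above for
#    'edge_embedding.weight'.
out_dim, num_pairs, num_rbf = 4, 25, 3
flat = torch.randn(out_dim, num_pairs * num_rbf)
pair_perm = torch.randperm(num_pairs)  # stand-in for the legacy->new mapping
reordered = (
    flat.view(out_dim, num_pairs, num_rbf)[:, pair_perm, :]
    .reshape(out_dim, num_pairs * num_rbf)
)
assert reordered.shape == flat.shape
```

Building the index from the new order (rather than permuting the legacy one) keeps the mapping direction explicit: position i of the new matrix pulls row `perm[i]` from the legacy matrix.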
rc_foundry-0.1.1.dist-info/METADATA ADDED
@@ -0,0 +1,239 @@
+ Metadata-Version: 2.4
+ Name: rc-foundry
+ Version: 0.1.1
+ Summary: Shared utilities and training infrastructure for biomolecular structure prediction models.
+ Author-email: Institute for Protein Design <contact@ipd.uw.edu>
+ License: BSD 3-Clause License
+
+ Copyright (c) 2025, Institute for Protein Design, University of Washington
+
+ Redistribution and use in source and binary forms, with or without
+ modification, are permitted provided that the following conditions are met:
+
+ * Redistributions of source code must retain the above copyright notice, this
+ list of conditions and the following disclaimer.
+
+ * Redistributions in binary form must reproduce the above copyright notice,
+ this list of conditions and the following disclaimer in the documentation
+ and/or other materials provided with the distribution.
+
+ * Neither the name of the copyright holder nor the names of its
+ contributors may be used to endorse or promote products derived from
+ this software without specific prior written permission.
+
+ THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
+ AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+ IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+ DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
+ FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+ DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
+ SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
+ CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
+ OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+ OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ License-File: LICENSE.md
+ Classifier: Intended Audience :: Developers
+ Classifier: Intended Audience :: Science/Research
+ Classifier: License :: OSI Approved :: BSD License
+ Classifier: Natural Language :: English
+ Classifier: Operating System :: MacOS
+ Classifier: Operating System :: Microsoft :: Windows
+ Classifier: Operating System :: POSIX :: Linux
+ Classifier: Programming Language :: Python :: 3
+ Classifier: Programming Language :: Python :: Implementation :: CPython
+ Classifier: Topic :: Scientific/Engineering :: Bio-Informatics
+ Requires-Python: >=3.12
+ Requires-Dist: assertpy
+ Requires-Dist: atomworks[ml]>=2.1.1
+ Requires-Dist: beartype<1,>=0.18.0
+ Requires-Dist: dm-tree<1,>=0.1.6
+ Requires-Dist: einops<1,>=0.8.0
+ Requires-Dist: einx<1,>=0.1.0
+ Requires-Dist: environs<12,>=11.0.0
+ Requires-Dist: hydra-core<1.4,>=1.3.0
+ Requires-Dist: ipykernel>=6.31.0
+ Requires-Dist: jaxtyping<1,>=0.2.17
+ Requires-Dist: lightning>=2.5.0
+ Requires-Dist: loralib>=0.1.1
+ Requires-Dist: opt-einsum<4,>=3.4.0
+ Requires-Dist: pandas
+ Requires-Dist: rich>=13.9.4
+ Requires-Dist: rootutils<1.1,>=1.0.7
+ Requires-Dist: toolz
+ Requires-Dist: torch<3,>=2.2.0
+ Requires-Dist: typer<1,>=0.20.0
+ Requires-Dist: wandb<1,>=0.15.10
+ Requires-Dist: zstandard
+ Provides-Extra: all
+ Requires-Dist: cuequivariance-ops-cu12>=0.6.1; (sys_platform == 'linux') and extra == 'all'
+ Requires-Dist: cuequivariance-ops-torch-cu12>=0.6.1; (sys_platform == 'linux') and extra == 'all'
+ Requires-Dist: cuequivariance-torch>=0.6.1; (sys_platform == 'linux') and extra == 'all'
+ Requires-Dist: pydantic>=2.8; extra == 'all'
+ Provides-Extra: dev
+ Requires-Dist: assertpy; extra == 'dev'
+ Requires-Dist: atomworks[dev,ml,openbabel]>=2.1.1; extra == 'dev'
+ Requires-Dist: debugpy<2,>=1.8.5; extra == 'dev'
+ Requires-Dist: ipdb; extra == 'dev'
+ Requires-Dist: ipykernel<7,>=6.29.4; extra == 'dev'
+ Requires-Dist: pre-commit; extra == 'dev'
+ Requires-Dist: pytest-benchmark<6,>=5.0.0; extra == 'dev'
+ Requires-Dist: pytest-cov<5,>=4.1.0; extra == 'dev'
+ Requires-Dist: pytest-dotenv<1,>=0.5.2; extra == 'dev'
+ Requires-Dist: pytest-testmon<3,>=2.1.1; extra == 'dev'
+ Requires-Dist: pytest-xdist<4,>=3.6.1; extra == 'dev'
+ Requires-Dist: pytest<9,>=8.2.0; extra == 'dev'
+ Requires-Dist: ruff==0.8.3; extra == 'dev'
+ Provides-Extra: rf3
+ Requires-Dist: cuequivariance-ops-cu12>=0.6.1; (sys_platform == 'linux') and extra == 'rf3'
+ Requires-Dist: cuequivariance-ops-torch-cu12>=0.6.1; (sys_platform == 'linux') and extra == 'rf3'
+ Requires-Dist: cuequivariance-torch>=0.6.1; (sys_platform == 'linux') and extra == 'rf3'
+ Provides-Extra: rfd3
+ Requires-Dist: pydantic>=2.8; extra == 'rfd3'
+ Description-Content-Type: text/markdown
+
+ # Protein design with Foundry
+
+ Foundry provides tooling and infrastructure for using and training all classes of models for protein design, including design (RFD3), inverse folding (ProteinMPNN) and protein folding (RF3).
+
+ All models within Foundry rely on [AtomWorks](https://github.com/RosettaCommons/atomworks) - a unified framework for manipulating and processing biomolecular structures - for both training and inference.
+
+ ## Getting Started
+ ### Quickstart guide
+ **Installation**
+ ```bash
+ pip install rc-foundry[all]
+ ```
+
+ **Downloading weights.** All models can be downloaded to a target folder with:
+
+ ```bash
+ foundry install all --checkpoint_dir <path/to/ckpt/dir>
+ ```
+ This will download all supported models (including multiple checkpoints of RF3), but as a beginner you can start with:
+ ```bash
+ foundry install rfd3 ligandmpnn rf3 --checkpoint_dir <path/to/ckpt/dir>
+ ```
+
+ > *See `examples/all.ipynb` for how to run each model in a notebook.*
+
+ ### RFdiffusion3 (RFD3)
+
+ [RFdiffusion3](https://www.biorxiv.org/content/10.1101/2025.09.18.676967v2) is an all-atom generative model capable of designing protein structures under complex constraints.
+
+ > *See [models/rfd3/README.md](models/rfd3/README.md) for complete documentation.*
+
+ <div align="center">
+ <img src="docs/_static/rfd3_trajectory.png" alt="RFdiffusion3 generation trajectory." width="400">
+ </div>
+
+ ### ProteinMPNN
+ [ProteinMPNN](https://www.science.org/doi/10.1126/science.add2187) and [LigandMPNN](https://www.nature.com/articles/s41592-025-02626-1) are lightweight inverse-folding models that can be used to design diverse sequences for backbones under constrained conditions.
+
+ > *See [models/mpnn/README.md](models/mpnn/README.md) for complete documentation.*
+
+
+ ### RoseTTAFold3 (RF3)
+
+ [RF3](https://doi.org/10.1101/2025.08.14.670328) is a structure prediction neural network that narrows the gap between the closed-source AF3 and open-source alternatives.
+
+ <div align="center">
+ <img src="docs/_static/prot_dna.png" alt="Protein-DNA complex prediction" width="400">
+ </div>
+
+ > *See [models/rf3/README.md](models/rf3/README.md) for complete documentation.*
+
+ ---
+
+ ## Development
+
+ ### Code Organization
+
+ **Strict dependency flow:** `foundry` → `atomworks`
+
+ - **atomworks**: Structure I/O, preprocessing, featurization
+ - **foundry**: Model architectures, training, inference endpoints
+ - **models/\<model\>:** Released models.
+
+ #### For Core Developers (Multiple Packages)
+
+ Install `foundry` and the models in editable mode for development:
+
+ ```bash
+ # Install foundry and all models in editable mode
+ uv pip install -e . -e ./models/rf3 -e ./models/rfd3 -e ./models/mpnn
+
+ # Or install only foundry (no models)
+ uv pip install -e .
+ ```
+
+ This approach allows you to:
+ - Modify `foundry` shared utilities and see changes immediately
+ - Work on specific models without installing all models
+ - Add new models as independent packages in `models/`
+
+ ### Adding New Models
+
+ To add a new model:
+
+ 1. Create a `models/<model_name>/` directory with its own `pyproject.toml`
+ 2. Add `foundry` as a dependency
+ 3. Implement model-specific code in `models/<model_name>/src/`
+ 4. Users can install it with: `uv pip install -e ./models/<model_name>`
+
+ ### Pre-commit Formatting
+
+ We ship a `.pre-commit-config.yaml` that runs `make format` (via `ruff format`) before each commit. Enable it once per clone:
+
+ ```bash
+ pip install pre-commit  # if not already installed
+ pre-commit install
+ ```
+
+ After installation, the hook automatically formats the repo whenever you `git commit`. Use `pre-commit run --all-files` to apply it manually.
+
+ ## Citation
+
+ If you use this repository code or data in your work, please cite the relevant work as below:
+
+ ```bibtex
+ @article{corley2025accelerating,
+   title={Accelerating biomolecular modeling with atomworks and rf3},
+   author={Corley, Nathaniel and Mathis, Simon and Krishna, Rohith and Bauer, Magnus S and Thompson, Tuscan R and Ahern, Woody and Kazman, Maxwell W and Brent, Rafael I and Didi, Kieran and Kubaney, Andrew and others},
+   journal={bioRxiv},
+   year={2025}
+ }
+
+ @article{butcher2025_rfdiffusion3,
+   author = {Butcher, Jasper and Krishna, Rohith and Mitra, Raktim and Brent, Rafael Isaac and Li, Yanjing and Corley, Nathaniel and Kim, Paul T and Funk, Jonathan and Mathis, Simon Valentin and Salike, Saman and Muraishi, Aiko and Eisenach, Helen and Thompson, Tuscan Rock and Chen, Jie and Politanska, Yuliya and Sehgal, Enisha and Coventry, Brian and Zhang, Odin and Qiang, Bo and Didi, Kieran and Kazman, Maxwell and DiMaio, Frank and Baker, David},
+   title = {De novo Design of All-atom Biomolecular Interactions with RFdiffusion3},
+   elocation-id = {2025.09.18.676967},
+   year = {2025},
+   doi = {10.1101/2025.09.18.676967},
+   publisher = {Cold Spring Harbor Laboratory},
+   URL = {https://www.biorxiv.org/content/early/2025/11/19/2025.09.18.676967},
+   eprint = {https://www.biorxiv.org/content/early/2025/11/19/2025.09.18.676967.full.pdf},
+   journal = {bioRxiv}
+ }
+
+ @article{dauparas2022robust,
+   title={Robust deep learning--based protein sequence design using ProteinMPNN},
+   author={Dauparas, Justas and Anishchenko, Ivan and Bennett, Nathaniel and Bai, Hua and Ragotte, Robert J and Milles, Lukas F and Wicky, Basile IM and Courbet, Alexis and de Haas, Rob J and Bethel, Neville and others},
+   journal={Science},
+   volume={378},
+   number={6615},
+   pages={49--56},
+   year={2022},
+   publisher={American Association for the Advancement of Science}
+ }
+
+ @article{dauparas2025atomic,
+   title={Atomic context-conditioned protein sequence design using LigandMPNN},
+   author={Dauparas, Justas and Lee, Gyu Rie and Pecoraro, Robert and An, Linna and Anishchenko, Ivan and Glasscock, Cameron and Baker, David},
+   journal={Nature Methods},
+   pages={1--7},
+   year={2025},
+   publisher={Nature Publishing Group US New York}
+ }
+ ```
+ ## Acknowledgments
+ We thank Rachel Clune and Hope Woods from the RosettaCommons for their collaboration on the codebase, documentation, tutorials, and examples.