PyPI - biotite - Versions diffs - 1.5.0__cp314-cp314-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl - Mend

biotite 1.5.0__cp314-cp314-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of biotite might be problematic. Click here for more details.

Files changed (354) hide show

biotite/__init__.py +18 -0
biotite/application/__init__.py +69 -0
biotite/application/application.py +276 -0
biotite/application/autodock/__init__.py +12 -0
biotite/application/autodock/app.py +500 -0
biotite/application/blast/__init__.py +14 -0
biotite/application/blast/alignment.py +92 -0
biotite/application/blast/webapp.py +428 -0
biotite/application/clustalo/__init__.py +12 -0
biotite/application/clustalo/app.py +223 -0
biotite/application/dssp/__init__.py +12 -0
biotite/application/dssp/app.py +216 -0
biotite/application/localapp.py +342 -0
biotite/application/mafft/__init__.py +12 -0
biotite/application/mafft/app.py +116 -0
biotite/application/msaapp.py +363 -0
biotite/application/muscle/__init__.py +13 -0
biotite/application/muscle/app3.py +227 -0
biotite/application/muscle/app5.py +163 -0
biotite/application/sra/__init__.py +18 -0
biotite/application/sra/app.py +447 -0
biotite/application/tantan/__init__.py +12 -0
biotite/application/tantan/app.py +199 -0
biotite/application/util.py +77 -0
biotite/application/viennarna/__init__.py +18 -0
biotite/application/viennarna/rnaalifold.py +310 -0
biotite/application/viennarna/rnafold.py +254 -0
biotite/application/viennarna/rnaplot.py +208 -0
biotite/application/viennarna/util.py +77 -0
biotite/application/webapp.py +76 -0
biotite/copyable.py +71 -0
biotite/database/__init__.py +23 -0
biotite/database/afdb/__init__.py +12 -0
biotite/database/afdb/download.py +197 -0
biotite/database/entrez/__init__.py +15 -0
biotite/database/entrez/check.py +60 -0
biotite/database/entrez/dbnames.py +101 -0
biotite/database/entrez/download.py +228 -0
biotite/database/entrez/key.py +44 -0
biotite/database/entrez/query.py +263 -0
biotite/database/error.py +16 -0
biotite/database/pubchem/__init__.py +21 -0
biotite/database/pubchem/download.py +258 -0
biotite/database/pubchem/error.py +30 -0
biotite/database/pubchem/query.py +819 -0
biotite/database/pubchem/throttle.py +98 -0
biotite/database/rcsb/__init__.py +13 -0
biotite/database/rcsb/download.py +161 -0
biotite/database/rcsb/query.py +963 -0
biotite/database/uniprot/__init__.py +13 -0
biotite/database/uniprot/check.py +40 -0
biotite/database/uniprot/download.py +126 -0
biotite/database/uniprot/query.py +292 -0
biotite/file.py +244 -0
biotite/interface/__init__.py +19 -0
biotite/interface/openmm/__init__.py +20 -0
biotite/interface/openmm/state.py +93 -0
biotite/interface/openmm/system.py +227 -0
biotite/interface/pymol/__init__.py +201 -0
biotite/interface/pymol/cgo.py +346 -0
biotite/interface/pymol/convert.py +185 -0
biotite/interface/pymol/display.py +267 -0
biotite/interface/pymol/object.py +1228 -0
biotite/interface/pymol/shapes.py +178 -0
biotite/interface/pymol/startup.py +169 -0
biotite/interface/rdkit/__init__.py +19 -0
biotite/interface/rdkit/mol.py +490 -0
biotite/interface/version.py +94 -0
biotite/interface/warning.py +19 -0
biotite/sequence/__init__.py +84 -0
biotite/sequence/align/__init__.py +199 -0
biotite/sequence/align/alignment.py +702 -0
biotite/sequence/align/banded.cpython-314-x86_64-linux-gnu.so +0 -0
biotite/sequence/align/banded.pyx +652 -0
biotite/sequence/align/buckets.py +71 -0
biotite/sequence/align/cigar.py +425 -0
biotite/sequence/align/kmeralphabet.cpython-314-x86_64-linux-gnu.so +0 -0
biotite/sequence/align/kmeralphabet.pyx +595 -0
biotite/sequence/align/kmersimilarity.cpython-314-x86_64-linux-gnu.so +0 -0
biotite/sequence/align/kmersimilarity.pyx +233 -0
biotite/sequence/align/kmertable.cpython-314-x86_64-linux-gnu.so +0 -0
biotite/sequence/align/kmertable.pyx +3411 -0
biotite/sequence/align/localgapped.cpython-314-x86_64-linux-gnu.so +0 -0
biotite/sequence/align/localgapped.pyx +892 -0
biotite/sequence/align/localungapped.cpython-314-x86_64-linux-gnu.so +0 -0
biotite/sequence/align/localungapped.pyx +279 -0
biotite/sequence/align/matrix.py +631 -0
biotite/sequence/align/matrix_data/3Di.mat +24 -0
biotite/sequence/align/matrix_data/BLOSUM100.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM30.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM35.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM40.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM45.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM50.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM50_13p.mat +25 -0
biotite/sequence/align/matrix_data/BLOSUM50_14.3.mat +25 -0
biotite/sequence/align/matrix_data/BLOSUM50_5.0.mat +25 -0
biotite/sequence/align/matrix_data/BLOSUM55.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM60.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM62.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM62_13p.mat +25 -0
biotite/sequence/align/matrix_data/BLOSUM62_14.3.mat +25 -0
biotite/sequence/align/matrix_data/BLOSUM62_5.0.mat +25 -0
biotite/sequence/align/matrix_data/BLOSUM65.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM70.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM75.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM80.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM85.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM90.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUMN.mat +31 -0
biotite/sequence/align/matrix_data/CorBLOSUM49_5.0.mat +25 -0
biotite/sequence/align/matrix_data/CorBLOSUM57_13p.mat +25 -0
biotite/sequence/align/matrix_data/CorBLOSUM57_14.3.mat +25 -0
biotite/sequence/align/matrix_data/CorBLOSUM61_5.0.mat +25 -0
biotite/sequence/align/matrix_data/CorBLOSUM66_13p.mat +25 -0
biotite/sequence/align/matrix_data/CorBLOSUM67_14.3.mat +25 -0
biotite/sequence/align/matrix_data/DAYHOFF.mat +32 -0
biotite/sequence/align/matrix_data/GONNET.mat +26 -0
biotite/sequence/align/matrix_data/IDENTITY.mat +25 -0
biotite/sequence/align/matrix_data/MATCH.mat +25 -0
biotite/sequence/align/matrix_data/NUC.mat +25 -0
biotite/sequence/align/matrix_data/PAM10.mat +34 -0
biotite/sequence/align/matrix_data/PAM100.mat +34 -0
biotite/sequence/align/matrix_data/PAM110.mat +34 -0
biotite/sequence/align/matrix_data/PAM120.mat +34 -0
biotite/sequence/align/matrix_data/PAM130.mat +34 -0
biotite/sequence/align/matrix_data/PAM140.mat +34 -0
biotite/sequence/align/matrix_data/PAM150.mat +34 -0
biotite/sequence/align/matrix_data/PAM160.mat +34 -0
biotite/sequence/align/matrix_data/PAM170.mat +34 -0
biotite/sequence/align/matrix_data/PAM180.mat +34 -0
biotite/sequence/align/matrix_data/PAM190.mat +34 -0
biotite/sequence/align/matrix_data/PAM20.mat +34 -0
biotite/sequence/align/matrix_data/PAM200.mat +34 -0
biotite/sequence/align/matrix_data/PAM210.mat +34 -0
biotite/sequence/align/matrix_data/PAM220.mat +34 -0
biotite/sequence/align/matrix_data/PAM230.mat +34 -0
biotite/sequence/align/matrix_data/PAM240.mat +34 -0
biotite/sequence/align/matrix_data/PAM250.mat +34 -0
biotite/sequence/align/matrix_data/PAM260.mat +34 -0
biotite/sequence/align/matrix_data/PAM270.mat +34 -0
biotite/sequence/align/matrix_data/PAM280.mat +34 -0
biotite/sequence/align/matrix_data/PAM290.mat +34 -0
biotite/sequence/align/matrix_data/PAM30.mat +34 -0
biotite/sequence/align/matrix_data/PAM300.mat +34 -0
biotite/sequence/align/matrix_data/PAM310.mat +34 -0
biotite/sequence/align/matrix_data/PAM320.mat +34 -0
biotite/sequence/align/matrix_data/PAM330.mat +34 -0
biotite/sequence/align/matrix_data/PAM340.mat +34 -0
biotite/sequence/align/matrix_data/PAM350.mat +34 -0
biotite/sequence/align/matrix_data/PAM360.mat +34 -0
biotite/sequence/align/matrix_data/PAM370.mat +34 -0
biotite/sequence/align/matrix_data/PAM380.mat +34 -0
biotite/sequence/align/matrix_data/PAM390.mat +34 -0
biotite/sequence/align/matrix_data/PAM40.mat +34 -0
biotite/sequence/align/matrix_data/PAM400.mat +34 -0
biotite/sequence/align/matrix_data/PAM410.mat +34 -0
biotite/sequence/align/matrix_data/PAM420.mat +34 -0
biotite/sequence/align/matrix_data/PAM430.mat +34 -0
biotite/sequence/align/matrix_data/PAM440.mat +34 -0
biotite/sequence/align/matrix_data/PAM450.mat +34 -0
biotite/sequence/align/matrix_data/PAM460.mat +34 -0
biotite/sequence/align/matrix_data/PAM470.mat +34 -0
biotite/sequence/align/matrix_data/PAM480.mat +34 -0
biotite/sequence/align/matrix_data/PAM490.mat +34 -0
biotite/sequence/align/matrix_data/PAM50.mat +34 -0
biotite/sequence/align/matrix_data/PAM500.mat +34 -0
biotite/sequence/align/matrix_data/PAM60.mat +34 -0
biotite/sequence/align/matrix_data/PAM70.mat +34 -0
biotite/sequence/align/matrix_data/PAM80.mat +34 -0
biotite/sequence/align/matrix_data/PAM90.mat +34 -0
biotite/sequence/align/matrix_data/PB.license +21 -0
biotite/sequence/align/matrix_data/PB.mat +18 -0
biotite/sequence/align/matrix_data/RBLOSUM52_5.0.mat +25 -0
biotite/sequence/align/matrix_data/RBLOSUM59_13p.mat +25 -0
biotite/sequence/align/matrix_data/RBLOSUM59_14.3.mat +25 -0
biotite/sequence/align/matrix_data/RBLOSUM64_5.0.mat +25 -0
biotite/sequence/align/matrix_data/RBLOSUM69_13p.mat +25 -0
biotite/sequence/align/matrix_data/RBLOSUM69_14.3.mat +25 -0
biotite/sequence/align/multiple.cpython-314-x86_64-linux-gnu.so +0 -0
biotite/sequence/align/multiple.pyx +619 -0
biotite/sequence/align/pairwise.cpython-314-x86_64-linux-gnu.so +0 -0
biotite/sequence/align/pairwise.pyx +585 -0
biotite/sequence/align/permutation.cpython-314-x86_64-linux-gnu.so +0 -0
biotite/sequence/align/permutation.pyx +313 -0
biotite/sequence/align/primes.txt +821 -0
biotite/sequence/align/selector.cpython-314-x86_64-linux-gnu.so +0 -0
biotite/sequence/align/selector.pyx +954 -0
biotite/sequence/align/statistics.py +264 -0
biotite/sequence/align/tracetable.cpython-314-x86_64-linux-gnu.so +0 -0
biotite/sequence/align/tracetable.pxd +64 -0
biotite/sequence/align/tracetable.pyx +370 -0
biotite/sequence/alphabet.py +555 -0
biotite/sequence/annotation.py +836 -0
biotite/sequence/codec.cpython-314-x86_64-linux-gnu.so +0 -0
biotite/sequence/codec.pyx +155 -0
biotite/sequence/codon.py +476 -0
biotite/sequence/codon_tables.txt +202 -0
biotite/sequence/graphics/__init__.py +33 -0
biotite/sequence/graphics/alignment.py +1101 -0
biotite/sequence/graphics/color_schemes/3di_flower.json +48 -0
biotite/sequence/graphics/color_schemes/autumn.json +51 -0
biotite/sequence/graphics/color_schemes/blossom.json +51 -0
biotite/sequence/graphics/color_schemes/clustalx_dna.json +11 -0
biotite/sequence/graphics/color_schemes/clustalx_protein.json +28 -0
biotite/sequence/graphics/color_schemes/flower.json +51 -0
biotite/sequence/graphics/color_schemes/jalview_buried.json +31 -0
biotite/sequence/graphics/color_schemes/jalview_hydrophobicity.json +31 -0
biotite/sequence/graphics/color_schemes/jalview_prop_helix.json +31 -0
biotite/sequence/graphics/color_schemes/jalview_prop_strand.json +31 -0
biotite/sequence/graphics/color_schemes/jalview_prop_turn.json +31 -0
biotite/sequence/graphics/color_schemes/jalview_taylor.json +28 -0
biotite/sequence/graphics/color_schemes/jalview_zappo.json +28 -0
biotite/sequence/graphics/color_schemes/ocean.json +51 -0
biotite/sequence/graphics/color_schemes/pb_flower.json +40 -0
biotite/sequence/graphics/color_schemes/rainbow_dna.json +11 -0
biotite/sequence/graphics/color_schemes/rainbow_protein.json +30 -0
biotite/sequence/graphics/color_schemes/spring.json +51 -0
biotite/sequence/graphics/color_schemes/sunset.json +51 -0
biotite/sequence/graphics/color_schemes/wither.json +51 -0
biotite/sequence/graphics/colorschemes.py +170 -0
biotite/sequence/graphics/dendrogram.py +231 -0
biotite/sequence/graphics/features.py +544 -0
biotite/sequence/graphics/logo.py +102 -0
biotite/sequence/graphics/plasmid.py +712 -0
biotite/sequence/io/__init__.py +12 -0
biotite/sequence/io/fasta/__init__.py +22 -0
biotite/sequence/io/fasta/convert.py +283 -0
biotite/sequence/io/fasta/file.py +265 -0
biotite/sequence/io/fastq/__init__.py +19 -0
biotite/sequence/io/fastq/convert.py +117 -0
biotite/sequence/io/fastq/file.py +507 -0
biotite/sequence/io/genbank/__init__.py +17 -0
biotite/sequence/io/genbank/annotation.py +269 -0
biotite/sequence/io/genbank/file.py +573 -0
biotite/sequence/io/genbank/metadata.py +336 -0
biotite/sequence/io/genbank/sequence.py +173 -0
biotite/sequence/io/general.py +201 -0
biotite/sequence/io/gff/__init__.py +26 -0
biotite/sequence/io/gff/convert.py +128 -0
biotite/sequence/io/gff/file.py +449 -0
biotite/sequence/phylo/__init__.py +36 -0
biotite/sequence/phylo/nj.cpython-314-x86_64-linux-gnu.so +0 -0
biotite/sequence/phylo/nj.pyx +221 -0
biotite/sequence/phylo/tree.cpython-314-x86_64-linux-gnu.so +0 -0
biotite/sequence/phylo/tree.pyx +1169 -0
biotite/sequence/phylo/upgma.cpython-314-x86_64-linux-gnu.so +0 -0
biotite/sequence/phylo/upgma.pyx +164 -0
biotite/sequence/profile.py +561 -0
biotite/sequence/search.py +117 -0
biotite/sequence/seqtypes.py +720 -0
biotite/sequence/sequence.py +373 -0
biotite/setup_ccd.py +197 -0
biotite/structure/__init__.py +135 -0
biotite/structure/alphabet/__init__.py +25 -0
biotite/structure/alphabet/encoder.py +332 -0
biotite/structure/alphabet/encoder_weights_3di.kerasify +0 -0
biotite/structure/alphabet/i3d.py +109 -0
biotite/structure/alphabet/layers.py +86 -0
biotite/structure/alphabet/pb.license +21 -0
biotite/structure/alphabet/pb.py +170 -0
biotite/structure/alphabet/unkerasify.py +128 -0
biotite/structure/atoms.py +1562 -0
biotite/structure/basepairs.py +1403 -0
biotite/structure/bonds.cpython-314-x86_64-linux-gnu.so +0 -0
biotite/structure/bonds.pyx +2036 -0
biotite/structure/box.py +724 -0
biotite/structure/celllist.cpython-314-x86_64-linux-gnu.so +0 -0
biotite/structure/celllist.pyx +864 -0
biotite/structure/chains.py +310 -0
biotite/structure/charges.cpython-314-x86_64-linux-gnu.so +0 -0
biotite/structure/charges.pyx +520 -0
biotite/structure/compare.py +683 -0
biotite/structure/density.py +109 -0
biotite/structure/dotbracket.py +213 -0
biotite/structure/error.py +39 -0
biotite/structure/filter.py +591 -0
biotite/structure/geometry.py +817 -0
biotite/structure/graphics/__init__.py +13 -0
biotite/structure/graphics/atoms.py +243 -0
biotite/structure/graphics/rna.py +298 -0
biotite/structure/hbond.py +425 -0
biotite/structure/info/__init__.py +24 -0
biotite/structure/info/atom_masses.json +121 -0
biotite/structure/info/atoms.py +98 -0
biotite/structure/info/bonds.py +149 -0
biotite/structure/info/ccd.py +200 -0
biotite/structure/info/components.bcif +0 -0
biotite/structure/info/groups.py +128 -0
biotite/structure/info/masses.py +121 -0
biotite/structure/info/misc.py +137 -0
biotite/structure/info/radii.py +267 -0
biotite/structure/info/standardize.py +185 -0
biotite/structure/integrity.py +213 -0
biotite/structure/io/__init__.py +29 -0
biotite/structure/io/dcd/__init__.py +13 -0
biotite/structure/io/dcd/file.py +67 -0
biotite/structure/io/general.py +243 -0
biotite/structure/io/gro/__init__.py +14 -0
biotite/structure/io/gro/file.py +343 -0
biotite/structure/io/mol/__init__.py +20 -0
biotite/structure/io/mol/convert.py +112 -0
biotite/structure/io/mol/ctab.py +420 -0
biotite/structure/io/mol/header.py +120 -0
biotite/structure/io/mol/mol.py +149 -0
biotite/structure/io/mol/sdf.py +940 -0
biotite/structure/io/netcdf/__init__.py +13 -0
biotite/structure/io/netcdf/file.py +64 -0
biotite/structure/io/pdb/__init__.py +20 -0
biotite/structure/io/pdb/convert.py +389 -0
biotite/structure/io/pdb/file.py +1380 -0
biotite/structure/io/pdb/hybrid36.cpython-314-x86_64-linux-gnu.so +0 -0
biotite/structure/io/pdb/hybrid36.pyx +242 -0
biotite/structure/io/pdbqt/__init__.py +15 -0
biotite/structure/io/pdbqt/convert.py +113 -0
biotite/structure/io/pdbqt/file.py +688 -0
biotite/structure/io/pdbx/__init__.py +23 -0
biotite/structure/io/pdbx/bcif.py +674 -0
biotite/structure/io/pdbx/cif.py +1091 -0
biotite/structure/io/pdbx/component.py +251 -0
biotite/structure/io/pdbx/compress.py +362 -0
biotite/structure/io/pdbx/convert.py +2113 -0
biotite/structure/io/pdbx/encoding.cpython-314-x86_64-linux-gnu.so +0 -0
biotite/structure/io/pdbx/encoding.pyx +1078 -0
biotite/structure/io/trajfile.py +696 -0
biotite/structure/io/trr/__init__.py +13 -0
biotite/structure/io/trr/file.py +43 -0
biotite/structure/io/util.py +38 -0
biotite/structure/io/xtc/__init__.py +13 -0
biotite/structure/io/xtc/file.py +43 -0
biotite/structure/mechanics.py +72 -0
biotite/structure/molecules.py +337 -0
biotite/structure/pseudoknots.py +622 -0
biotite/structure/rdf.py +245 -0
biotite/structure/repair.py +302 -0
biotite/structure/residues.py +716 -0
biotite/structure/rings.py +451 -0
biotite/structure/sasa.cpython-314-x86_64-linux-gnu.so +0 -0
biotite/structure/sasa.pyx +322 -0
biotite/structure/segments.py +328 -0
biotite/structure/sequence.py +110 -0
biotite/structure/spacegroups.json +1567 -0
biotite/structure/spacegroups.license +26 -0
biotite/structure/sse.py +306 -0
biotite/structure/superimpose.py +511 -0
biotite/structure/tm.py +581 -0
biotite/structure/transform.py +736 -0
biotite/structure/util.py +160 -0
biotite/version.py +34 -0
biotite/visualize.py +375 -0
biotite-1.5.0.dist-info/METADATA +162 -0
biotite-1.5.0.dist-info/RECORD +354 -0
biotite-1.5.0.dist-info/WHEEL +6 -0
biotite-1.5.0.dist-info/licenses/LICENSE.rst +30 -0

biotite/structure/hbond.py ADDED Viewed

@@ -0,0 +1,425 @@
+# This source code is part of the Biotite package and is distributed
+# under the 3-Clause BSD License. Please see 'LICENSE.rst' for further
+# information.
+"""
+This module provides functions for hydrogen bonding calculation.
+"""
+__name__ = "biotite.structure"  # NOTE(review): presumably re-homes this module's API under the subpackage name - confirm
+__author__ = "Daniel Bauer, Patrick Kunzmann"
+__all__ = ["hbond", "hbond_frequency"]  # names exported by a star import of this module
+import warnings
+import numpy as np
+from biotite.structure.atoms import AtomArrayStack, stack
+from biotite.structure.celllist import CellList
+from biotite.structure.geometry import angle, distance
+def hbond(
+    atoms,
+    selection1=None,
+    selection2=None,
+    selection1_type="both",
+    cutoff_dist=2.5,
+    cutoff_angle=120,
+    donor_elements=("O", "N", "S"),
+    acceptor_elements=("O", "N", "S"),
+    periodic=False,
+):
+    r"""
+    Find hydrogen bonds in a structure using the Baker-Hubbard
+    algorithm. :footcite:`Baker1984`
+    This function identifies hydrogen bonds based on the bond angle
+    :math:`\theta` and the bond distance :math:`d_{H,A}`.
+    The default criteria is :math:`\theta > 120^{\circ}`
+    and :math:`d_{H,A} \le 2.5 \mathring{A}`.
+    Consequently, the given structure must contain hydrogen atoms.
+    Otherwise, no hydrogen bonds will be found.
+    Parameters
+    ----------
+    atoms : AtomArray or AtomArrayStack
+        The atoms to find hydrogen bonds in.
+    selection1, selection2 : ndarray, optional
+        Boolean mask for atoms to limit the hydrogen bond search to
+        specific sections of the model. The shape must match the
+        shape of the `atoms` argument. If None is given, the whole atoms
+        stack is used instead.
+    selection1_type : {'acceptor', 'donor', 'both'}, optional
+        Determines the type of `selection1`.
+        The type of `selection2` is chosen accordingly
+        ('both' or the opposite).
+    cutoff_dist : float, optional
+        The maximal distance between the hydrogen and acceptor to be
+        considered a hydrogen bond.
+    cutoff_angle : float, optional
+        The angle cutoff in degree between Donor-H..Acceptor to be
+        considered a hydrogen bond.
+    donor_elements, acceptor_elements : tuple of str
+        Elements to be considered as possible donors or acceptors.
+    periodic : bool, optional
+        If true, hydrogen bonds can also be detected in periodic
+        boundary conditions.
+        The `box` attribute of `atoms` is required in this case.
+    Returns
+    -------
+    triplets : ndarray, dtype=int, shape=(n,3)
+        *n x 3* matrix containing the indices of every Donor-H..Acceptor
+        interaction that is available in any of the models.
+        *n* is the number of found interactions.
+        The three matrix columns are *D_index*, *H_index*, *A_index*.
+        If only one model (`AtomArray`) is given, `triplets` contains
+        all of its hydrogen bonds.
+    mask : ndarry, dtype=bool, shape=(m,n)
+        *m x n* matrix that shows if an interaction with index *n* in
+        `triplets` is present in the model *m* of the input `atoms`.
+        Only returned if `atoms` is an :class:`AtomArrayStack`.
+    See Also
+    --------
+    hbond_frequency : Compute the frequency of each bond over the models.
+    Notes
+    -----
+    The result of this function may include false positives:
+    Only the chemical elements and the bond geometry is checked.
+    However, there are some cases where a hydrogen bond is still not
+    reasonable.
+    For example, a nitrogen atom with positive charge could be
+    considered as acceptor atom by this method, although this does
+    make sense from a chemical perspective.
+    References
+    ----------
+    .. footbibliography::
+    Examples
+    --------
+    Calculate the total number of hydrogen bonds found in each model:
+    >>> triplets, mask = hbond(atom_array_stack)
+    >>> hbonds_per_model = np.count_nonzero(mask, axis=1)
+    >>> print(hbonds_per_model)
+    [14 14 14 12 11 12  9 13  9 14 13 13 14 11 11 12 11 14 14 13 14 13 15 17
+     14 12 15 12 12 13 13 13 12 12 11 14 10 11]
+    Get hydrogen bond donors of third model:
+    >>> # Third model -> index 2
+    >>> triplets = triplets[mask[2,:]]
+    >>> # First column contains donors
+    >>> print(atom_array_stack[2, triplets[:,0]])
+        A       5  GLN N      N        -5.009   -0.575   -1.365
+        A       6  TRP N      N        -2.154   -0.497   -1.588
+        A       7  LEU N      N        -1.520   -1.904    0.893
+        A       8  LYS N      N        -2.716   -4.413    0.176
+        A       8  LYS NZ     N        -6.352   -4.311   -4.482
+        A       9  ASP N      N        -0.694   -5.301   -1.644
+        A      11  GLY N      N         2.142   -4.244    1.916
+        A      10  GLY N      N         1.135   -6.232    0.250
+        A      14  SER OG     O         4.689   -5.759   -2.390
+        A      13  SER N      N         6.424   -5.220    3.257
+        A      14  SER N      N         6.424   -5.506    0.464
+        A      15  GLY N      N         8.320   -3.632   -0.318
+        A      16  ARG N      N         8.043   -1.206   -1.866
+        A       6  TRP NE1    N         3.420    0.332   -0.121
+    """
+    if not (atoms.element == "H").any():
+        warnings.warn(
+            "Input structure does not contain hydrogen atoms, "
+            "hence no hydrogen bonds can be identified"
+        )
+    # Create AtomArrayStack from AtomArray
+    if not isinstance(atoms, AtomArrayStack):
+        atoms = stack([atoms])
+        single_model = True
+    else:
+        single_model = False
+    if periodic:
+        box = atoms.box
+    else:
+        box = None
+    # Mask for donor/acceptor elements
+    donor_element_mask = np.isin(atoms.element, donor_elements)
+    acceptor_element_mask = np.isin(atoms.element, acceptor_elements)
+    if selection1 is None:
+        selection1 = np.ones(atoms.array_length(), dtype=bool)
+    if selection2 is None:
+        selection2 = np.ones(atoms.array_length(), dtype=bool)
+    if selection1_type == "both":
+        # The two selections are separated into three selections:
+        # the original ones without the overlaping part
+        # and one containing the overlap
+        # This prevents redundant triplets and unnecessary computation
+        overlap_selection = selection1 & selection2
+        # Original selections without overlaping part
+        exclusive_selection1 = selection1 & (~overlap_selection)
+        exclusive_selection2 = selection2 & (~overlap_selection)
+        # Put selections to list for cleaner iteration
+        selections = [exclusive_selection1, exclusive_selection2, overlap_selection]
+        selection_combinations = [
+            # (0,0),   is not included, would be same selection
+            #         as donor and acceptor simultaneously
+            (0, 1),
+            (0, 2),
+            (1, 0),
+            # (1,1),   # same reason above
+            (1, 2),
+            (2, 0),
+            (2, 1),
+            (2, 2),  # overlaping part, combination is necessary
+        ]
+        all_comb_triplets = []
+        all_comb_mask = []
+        for selection_index1, selection_index2 in selection_combinations:
+            donor_mask = selections[selection_index1]
+            acceptor_mask = selections[selection_index2]
+            if (
+                np.count_nonzero(donor_mask) != 0
+                and np.count_nonzero(acceptor_mask) != 0
+            ):
+                # Calculate triplets and mask
+                triplets, mask = _hbond(
+                    atoms,
+                    donor_mask,
+                    acceptor_mask,
+                    donor_element_mask,
+                    acceptor_element_mask,
+                    cutoff_dist,
+                    cutoff_angle,
+                    box,
+                )
+                all_comb_triplets.append(triplets)
+                all_comb_mask.append(mask)
+        # Merge results from all combinations
+        triplets = np.concatenate(all_comb_triplets, axis=0)
+        mask = np.concatenate(all_comb_mask, axis=1)
+    elif selection1_type == "donor":
+        triplets, mask = _hbond(
+            atoms,
+            selection1,
+            selection2,
+            donor_element_mask,
+            acceptor_element_mask,
+            cutoff_dist,
+            cutoff_angle,
+            box,
+        )
+    elif selection1_type == "acceptor":
+        triplets, mask = _hbond(
+            atoms,
+            selection2,
+            selection1,
+            donor_element_mask,
+            acceptor_element_mask,
+            cutoff_dist,
+            cutoff_angle,
+            box,
+        )
+    else:
+        raise ValueError(f"Unkown selection type '{selection1_type}'")
+    if single_model:
+        # For a atom array (not stack),
+        # hbond_mask contains only 'True' values,
+        # since all interaction are in the one model
+        # -> Simply return triplets without hbond_mask
+        return triplets
+    else:
+        return triplets, mask
+def _hbond(
+    atoms,
+    donor_mask,
+    acceptor_mask,
+    donor_element_mask,
+    acceptor_element_mask,
+    cutoff_dist,
+    cutoff_angle,
+    box,
+):
+    # Filter donor/acceptor elements
+    donor_mask &= donor_element_mask
+    acceptor_mask &= acceptor_element_mask
+    first_model_box = box[0] if box is not None else None
+    if atoms.bonds is not None:
+        donor_h_mask, associated_donor_indices = _get_bonded_h(
+            atoms[0], donor_mask, atoms.bonds
+        )
+    else:
+        warnings.warn(
+            "Input structure has no associated 'BondList', "
+            "Hydrogen atoms bonded to donors are detected by distance"
+        )
+        donor_h_mask, associated_donor_indices = _get_bonded_h_via_distance(
+            atoms[0], donor_mask, first_model_box
+        )
+    donor_h_i = np.where(donor_h_mask)[0]
+    acceptor_i = np.where(acceptor_mask)[0]
+    if len(donor_h_i) == 0 or len(acceptor_i) == 0:
+        # Return empty triplets and mask
+        return (
+            np.zeros((0, 3), dtype=int),
+            np.zeros((atoms.stack_depth(), 0), dtype=bool),
+        )
+    # Narrow the amount of possible acceptor to donor-H connections
+    # down via the distance cutoff parameter using a cell list
+    # Save in acceptor-to-hydrogen matrix
+    # (true when distance smaller than cutoff)
+    coord = atoms.coord
+    possible_bonds = np.zeros((len(acceptor_i), len(donor_h_i)), dtype=bool)
+    periodic = False if box is None else True
+    for model_i in range(atoms.stack_depth()):
+        donor_h_coord = coord[model_i, donor_h_mask]
+        acceptor_coord = coord[model_i, acceptor_mask]
+        box_for_model = box[model_i] if box is not None else None
+        cell_list = CellList(
+            donor_h_coord, cell_size=cutoff_dist, periodic=periodic, box=box_for_model
+        )
+        possible_bonds |= cell_list.get_atoms_in_cells(acceptor_coord, as_mask=True)
+    possible_bonds_i = np.where(possible_bonds)
+    # Narrow down
+    acceptor_i = acceptor_i[possible_bonds_i[0]]
+    donor_h_i = donor_h_i[possible_bonds_i[1]]
+    # Build D-H..A triplets
+    donor_i = associated_donor_indices[donor_h_i]
+    triplets = np.stack((donor_i, donor_h_i, acceptor_i), axis=1)
+    # Remove entries where donor and acceptor are the same
+    triplets = triplets[donor_i != acceptor_i]
+    hbond_mask = _is_hbond(
+        coord[:, triplets[:, 0]],  # donors
+        coord[:, triplets[:, 1]],  # donor hydrogens
+        coord[:, triplets[:, 2]],  # acceptors
+        box,
+        cutoff_dist=cutoff_dist,
+        cutoff_angle=cutoff_angle,
+    )
+    # Reduce output to contain only triplets counted at least once
+    is_counted = hbond_mask.any(axis=0)
+    triplets = triplets[is_counted]
+    hbond_mask = hbond_mask[:, is_counted]
+    return triplets, hbond_mask
+def _get_bonded_h(array, donor_mask, bonds):
+    """
+    Helper function to find indices of associated hydrogens in atoms for
+    all donors in atoms[donor_mask].
+    A `BondsList` is used for detecting bonded hydrogen atoms.
+    """
+    hydrogen_mask = array.element == "H"
+    donor_hydrogen_mask = np.zeros(len(array), dtype=bool)
+    associated_donor_indices = np.full(len(array), -1, dtype=int)
+    all_bond_indices, _ = bonds.get_all_bonds()
+    donor_indices = np.where(donor_mask)[0]
+    for donor_i in donor_indices:
+        bonded_indices = all_bond_indices[donor_i]
+        # Remove padding values
+        bonded_indices = bonded_indices[bonded_indices != -1]
+        # Filter hydrogen atoms
+        bonded_indices = bonded_indices[hydrogen_mask[bonded_indices]]
+        donor_hydrogen_mask[bonded_indices] = True
+        associated_donor_indices[bonded_indices] = donor_i
+    return donor_hydrogen_mask, associated_donor_indices
+def _get_bonded_h_via_distance(array, donor_mask, box):
+    """
+    Helper function to find indices of associated hydrogens in atoms for
+    all donors in atoms[donor_mask].
+    The criterium is that the hydrogen must be in the same residue and
+    the distance must be smaller than the cutoff.
+    """
+    CUTOFF = 1.5
+    coord = array.coord
+    res_id = array.res_id
+    hydrogen_mask = array.element == "H"
+    donor_hydrogen_mask = np.zeros(len(array), dtype=bool)
+    associated_donor_indices = np.full(len(array), -1, dtype=int)
+    donor_indices = np.where(donor_mask)[0]
+    for donor_i in donor_indices:
+        candidate_mask = hydrogen_mask & (res_id == res_id[donor_i])
+        distances = distance(coord[donor_i], coord[candidate_mask], box=box)
+        donor_h_indices = np.where(candidate_mask)[0][distances <= CUTOFF]
+        for i in donor_h_indices:
+            associated_donor_indices[i] = donor_i
+            donor_hydrogen_mask[i] = True
+    return donor_hydrogen_mask, associated_donor_indices
+def _is_hbond(donor, donor_h, acceptor, box, cutoff_dist, cutoff_angle):
+    """
+    Filter triplets that meet distance and angle condition.
+    """
+    cutoff_angle_rad = np.deg2rad(cutoff_angle)
+    theta = angle(donor, donor_h, acceptor, box=box)
+    dist = distance(donor_h, acceptor, box=box)
+    return (theta > cutoff_angle_rad) & (dist <= cutoff_dist)
+def hbond_frequency(mask):
+    """
+    Get the relative frequency of each hydrogen bond in a multi-model
+    structure.
+    The frequency is the amount of models, where the respective bond
+    exists divided by the total amount of models.
+    Parameters
+    ----------
+    mask : ndarray, dtype=bool, shape=(m,n)
+        Input mask obtained from `hbond` function.
+    Returns
+    -------
+    ndarray, dtype=Float
+        For each individual interaction *n* of the mask, returns the
+        percentage of models *m*, in which this hydrogen bond is
+        present.
+    See Also
+    --------
+    hbond : Returns the mask that can be input into this function.
+    Examples
+    --------
+    >>> triplets, mask = hbond(atom_array_stack)
+    >>> freq = hbond_frequency(mask)
+    >>> print(freq)
+    [0.263 0.289 0.105 0.105 0.237 0.026 0.053 0.395 1.000 1.000 1.000 0.026
+     0.421 0.026 0.026 0.316 0.816 0.026 0.921 0.026 0.342 0.026 0.105 0.026
+     0.132 0.053 0.026 0.158 0.026 0.868 0.211 0.026 0.921 0.316 0.079 0.237
+     0.105 0.421 0.079 0.026 1.000 0.053 0.132 0.026 0.184]
+    """
+    return mask.sum(axis=0) / len(mask)

biotite/structure/info/__init__.py ADDED Viewed

@@ -0,0 +1,24 @@
+# This source code is part of the Biotite package and is distributed
+# under the 3-Clause BSD License. Please see 'LICENSE.rst' for further
+# information.
+"""
+A subpackage for obtaining all kinds of chemical information about atoms
+and residues, including masses, radii, bonds, etc.
+Most information is extracted from the *Chemical Component Dictionary*
+of the
+`wwPDB <ftp://ftp.wwpdb.org/pub/pdb/data/monomers/components.cif>`_.
+"""
+__name__ = "biotite.structure.info"
+__author__ = "Patrick Kunzmann, Tom David Müller"
+from .atoms import *
+from .bonds import *
+from .ccd import *
+from .groups import *
+from .masses import *
+from .misc import *
+from .radii import *
+from .standardize import *

biotite/structure/info/atom_masses.json ADDED Viewed

@@ -0,0 +1,121 @@
+{
+    "H"  :   1.008,
+    "D"  :   2.014,
+    "HE" :   4.002,
+    "LI" :   6.940,
+    "BE" :   9.012,
+    "B"  :  10.810,
+    "C"  :  12.011,
+    "N"  :  14.007,
+    "O"  :  15.999,
+    "F"  :  18.998,
+    "NE" :  20.180,
+    "NA" :  22.989,
+    "MG" :  24.305,
+    "AL" :  26.981,
+    "SI" :  28.085,
+    "P"  :  30.973,
+    "S"  :  32.060,
+    "CL" :  35.450,
+    "AR" :  39.948,
+    "K"  :  39.098,
+    "CA" :  40.078,
+    "SC" :  44.955,
+    "TI" :  47.867,
+    "V"  :  50.941,
+    "CR" :  51.996,
+    "MN" :  54.938,
+    "FE" :  55.845,
+    "CO" :  58.933,
+    "NI" :  58.693,
+    "CU" :  63.546,
+    "ZN" :  65.380,
+    "GA" :  69.723,
+    "GE" :  72.630,
+    "AS" :  74.921,
+    "SE" :  78.971,
+    "BR" :  79.904,
+    "KR" :  83.798,
+    "RB" :  85.468,
+    "SR" :  87.620,
+    "Y"  :  88.905,
+    "ZR" :  91.224,
+    "NB" :  92.906,
+    "MO" :  95.950,
+    "TC" :  97.000,
+    "RU" : 101.070,
+    "RH" : 102.905,
+    "PD" : 106.420,
+    "AG" : 107.868,
+    "CD" : 112.414,
+    "IN" : 114.818,
+    "SN" : 118.710,
+    "SB" : 121.760,
+    "TE" : 127.600,
+    "I"  : 126.904,
+    "XE" : 131.293,
+    "CS" : 132.905,
+    "BA" : 137.327,
+    "LA" : 138.905,
+    "CE" : 140.116,
+    "PR" : 140.907,
+    "ND" : 144.242,
+    "PM" : 145.000,
+    "SM" : 150.360,
+    "EU" : 151.964,
+    "GD" : 157.250,
+    "TB" : 158.925,
+    "DY" : 162.500,
+    "HO" : 164.930,
+    "ER" : 167.259,
+    "TM" : 168.934,
+    "YB" : 173.045,
+    "LU" : 174.967,
+    "HF" : 178.490,
+    "TA" : 180.947,
+    "W"  : 183.840,
+    "RE" : 186.207,
+    "OS" : 190.230,
+    "IR" : 192.217,
+    "PT" : 195.084,
+    "AU" : 196.966,
+    "HG" : 200.592,
+    "TL" : 204.380,
+    "PB" : 207.200,
+    "BI" : 208.980,
+    "PO" : 209.000,
+    "AT" : 210.000,
+    "RN" : 222.000,
+    "FR" : 223.000,
+    "RA" : 226.000,
+    "AC" : 227.000,
+    "TH" : 232.038,
+    "PA" : 231.035,
+    "U"  : 238.028,
+    "NP" : 237.000,
+    "PU" : 244.000,
+    "AM" : 243.000,
+    "CM" : 247.000,
+    "BK" : 247.000,
+    "CF" : 251.000,
+    "ES" : 252.000,
+    "FM" : 257.000,
+    "MD" : 258.000,
+    "NO" : 259.000,
+    "LR" : 262.000,
+    "RF" : 267.000,
+    "DB" : 270.000,
+    "SG" : 269.000,
+    "BH" : 270.000,
+    "HS" : 270.000,
+    "MT" : 278.000,
+    "DS" : 281.000,
+    "RG" : 281.000,
+    "CN" : 285.000,
+    "NH" : 286.000,
+    "FL" : 289.000,
+    "MC" : 289.000,
+    "LV" : 293.000,
+    "TS" : 293.000,
+    "OG" : 294.000
+}

biotite/structure/info/atoms.py ADDED Viewed

@@ -0,0 +1,98 @@
+# This source code is part of the Biotite package and is distributed
+# under the 3-Clause BSD License. Please see 'LICENSE.rst' for further
+# information.
+__name__ = "biotite.structure.info"
+__author__ = "Patrick Kunzmann"
+__all__ = ["residue"]
+import functools
+from biotite.structure.info.ccd import get_ccd
+# fmt: off
+NON_HETERO_RESIDUES = set([
+    "ALA", "ARG", "ASN", "ASP", "CYS", "GLN", "GLU", "GLY", "HIS",
+    "ILE", "LEU", "LYS", "MET", "PHE", "PRO", "PYL", "SER", "THR",
+    "TRP", "TYR", "VAL", "SEC",
+    "A", "DA", "G", "DG", "C", "DC", "U", "DT",
+])
+# fmt: on
+def residue(res_name, allow_missing_coord=False):
+    """
+    Get an atom array, representing the residue with the given name.
+    This atom array includes proper values for the ``residue_name``,
+    ``hetero``, ``atom_name``, ``element`` and ``charge`` annotation
+    arrays and bonds and coordinates.
+    Parameters
+    ----------
+    res_name : str
+        The up to 3-letter name of the residue.
+    allow_missing_coord : bool, optional
+        Whether to allow missing coordinate values in the residue.
+        If ``True``, these will be represented as ``nan`` values.
+        If ``False``, a ``ValueError`` is raised when missing coordinates
+        are encountered.
+    Returns
+    -------
+    atom_array : AtomArray
+        The atom array described by `res_name`.
+    Examples
+    --------
+    >>> alanine = residue("ALA")
+    >>> # Atoms and geometry
+    >>> print(alanine)
+                0  ALA N      N        -0.966    0.493    1.500
+                0  ALA CA     C         0.257    0.418    0.692
+                0  ALA C      C        -0.094    0.017   -0.716
+                0  ALA O      O        -1.056   -0.682   -0.923
+                0  ALA CB     C         1.204   -0.620    1.296
+                0  ALA OXT    O         0.661    0.439   -1.742
+                0  ALA H      H        -1.383   -0.425    1.482
+                0  ALA H2     H        -0.676    0.661    2.452
+                0  ALA HA     H         0.746    1.392    0.682
+                0  ALA HB1    H         1.459   -0.330    2.316
+                0  ALA HB2    H         0.715   -1.594    1.307
+                0  ALA HB3    H         2.113   -0.676    0.697
+                0  ALA HXT    H         0.435    0.182   -2.647
+    >>> # Bonds
+    >>> print(alanine.atom_name[alanine.bonds.as_array()[:,:2]])
+    [['N' 'CA']
+     ['N' 'H']
+     ['N' 'H2']
+     ['CA' 'C']
+     ['CA' 'CB']
+     ['CA' 'HA']
+     ['C' 'O']
+     ['C' 'OXT']
+     ['CB' 'HB1']
+     ['CB' 'HB2']
+     ['CB' 'HB3']
+     ['OXT' 'HXT']]
+    """
+    # Use a cache internally, but always return a copy,
+    # as the returned AtomArray is mutable
+    return _residue(res_name, allow_missing_coord).copy()
+@functools.lru_cache(maxsize=100)
+def _residue(res_name, allow_missing_coord=False):
+    # Avoid circular import
+    from biotite.structure.io.pdbx import get_component
+    try:
+        component = get_component(
+            get_ccd(),
+            res_name=res_name,
+            allow_missing_coord=allow_missing_coord,
+        )
+    except KeyError:
+        raise KeyError(f"No atom information found for residue '{res_name}' in CCD")
+    component.hetero[:] = res_name not in NON_HETERO_RESIDUES
+    return component