PyPI - biotite - Versions diffs - 0.41.1__cp312-cp312-macosx_10_16_arm64.whl - Mend

biotite 0.41.1__cp312-cp312-macosx_10_16_arm64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of biotite might be problematic. Click here for more details.

Files changed (340) hide show

biotite/__init__.py +19 -0
biotite/application/__init__.py +43 -0
biotite/application/application.py +265 -0
biotite/application/autodock/__init__.py +12 -0
biotite/application/autodock/app.py +505 -0
biotite/application/blast/__init__.py +14 -0
biotite/application/blast/alignment.py +83 -0
biotite/application/blast/webapp.py +421 -0
biotite/application/clustalo/__init__.py +12 -0
biotite/application/clustalo/app.py +238 -0
biotite/application/dssp/__init__.py +12 -0
biotite/application/dssp/app.py +152 -0
biotite/application/localapp.py +306 -0
biotite/application/mafft/__init__.py +12 -0
biotite/application/mafft/app.py +122 -0
biotite/application/msaapp.py +374 -0
biotite/application/muscle/__init__.py +13 -0
biotite/application/muscle/app3.py +254 -0
biotite/application/muscle/app5.py +171 -0
biotite/application/sra/__init__.py +18 -0
biotite/application/sra/app.py +456 -0
biotite/application/tantan/__init__.py +12 -0
biotite/application/tantan/app.py +222 -0
biotite/application/util.py +59 -0
biotite/application/viennarna/__init__.py +18 -0
biotite/application/viennarna/rnaalifold.py +304 -0
biotite/application/viennarna/rnafold.py +269 -0
biotite/application/viennarna/rnaplot.py +187 -0
biotite/application/viennarna/util.py +72 -0
biotite/application/webapp.py +77 -0
biotite/copyable.py +71 -0
biotite/database/__init__.py +23 -0
biotite/database/entrez/__init__.py +15 -0
biotite/database/entrez/check.py +61 -0
biotite/database/entrez/dbnames.py +89 -0
biotite/database/entrez/download.py +223 -0
biotite/database/entrez/key.py +44 -0
biotite/database/entrez/query.py +223 -0
biotite/database/error.py +15 -0
biotite/database/pubchem/__init__.py +21 -0
biotite/database/pubchem/download.py +260 -0
biotite/database/pubchem/error.py +20 -0
biotite/database/pubchem/query.py +827 -0
biotite/database/pubchem/throttle.py +99 -0
biotite/database/rcsb/__init__.py +13 -0
biotite/database/rcsb/download.py +167 -0
biotite/database/rcsb/query.py +959 -0
biotite/database/uniprot/__init__.py +13 -0
biotite/database/uniprot/check.py +32 -0
biotite/database/uniprot/download.py +134 -0
biotite/database/uniprot/query.py +209 -0
biotite/file.py +251 -0
biotite/sequence/__init__.py +73 -0
biotite/sequence/align/__init__.py +49 -0
biotite/sequence/align/alignment.py +658 -0
biotite/sequence/align/banded.cpython-312-darwin.so +0 -0
biotite/sequence/align/banded.pyx +652 -0
biotite/sequence/align/buckets.py +69 -0
biotite/sequence/align/cigar.py +434 -0
biotite/sequence/align/kmeralphabet.cpython-312-darwin.so +0 -0
biotite/sequence/align/kmeralphabet.pyx +574 -0
biotite/sequence/align/kmersimilarity.cpython-312-darwin.so +0 -0
biotite/sequence/align/kmersimilarity.pyx +233 -0
biotite/sequence/align/kmertable.cpython-312-darwin.so +0 -0
biotite/sequence/align/kmertable.pyx +3400 -0
biotite/sequence/align/localgapped.cpython-312-darwin.so +0 -0
biotite/sequence/align/localgapped.pyx +892 -0
biotite/sequence/align/localungapped.cpython-312-darwin.so +0 -0
biotite/sequence/align/localungapped.pyx +279 -0
biotite/sequence/align/matrix.py +405 -0
biotite/sequence/align/matrix_data/BLOSUM100.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM30.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM35.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM40.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM45.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM50.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM50_13p.mat +25 -0
biotite/sequence/align/matrix_data/BLOSUM50_14.3.mat +25 -0
biotite/sequence/align/matrix_data/BLOSUM50_5.0.mat +25 -0
biotite/sequence/align/matrix_data/BLOSUM55.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM60.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM62.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM62_13p.mat +25 -0
biotite/sequence/align/matrix_data/BLOSUM62_14.3.mat +25 -0
biotite/sequence/align/matrix_data/BLOSUM62_5.0.mat +25 -0
biotite/sequence/align/matrix_data/BLOSUM65.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM70.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM75.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM80.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM85.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUM90.mat +31 -0
biotite/sequence/align/matrix_data/BLOSUMN.mat +31 -0
biotite/sequence/align/matrix_data/CorBLOSUM49_5.0.mat +25 -0
biotite/sequence/align/matrix_data/CorBLOSUM57_13p.mat +25 -0
biotite/sequence/align/matrix_data/CorBLOSUM57_14.3.mat +25 -0
biotite/sequence/align/matrix_data/CorBLOSUM61_5.0.mat +25 -0
biotite/sequence/align/matrix_data/CorBLOSUM66_13p.mat +25 -0
biotite/sequence/align/matrix_data/CorBLOSUM67_14.3.mat +25 -0
biotite/sequence/align/matrix_data/DAYHOFF.mat +32 -0
biotite/sequence/align/matrix_data/GONNET.mat +26 -0
biotite/sequence/align/matrix_data/IDENTITY.mat +25 -0
biotite/sequence/align/matrix_data/MATCH.mat +25 -0
biotite/sequence/align/matrix_data/NUC.mat +25 -0
biotite/sequence/align/matrix_data/PAM10.mat +34 -0
biotite/sequence/align/matrix_data/PAM100.mat +34 -0
biotite/sequence/align/matrix_data/PAM110.mat +34 -0
biotite/sequence/align/matrix_data/PAM120.mat +34 -0
biotite/sequence/align/matrix_data/PAM130.mat +34 -0
biotite/sequence/align/matrix_data/PAM140.mat +34 -0
biotite/sequence/align/matrix_data/PAM150.mat +34 -0
biotite/sequence/align/matrix_data/PAM160.mat +34 -0
biotite/sequence/align/matrix_data/PAM170.mat +34 -0
biotite/sequence/align/matrix_data/PAM180.mat +34 -0
biotite/sequence/align/matrix_data/PAM190.mat +34 -0
biotite/sequence/align/matrix_data/PAM20.mat +34 -0
biotite/sequence/align/matrix_data/PAM200.mat +34 -0
biotite/sequence/align/matrix_data/PAM210.mat +34 -0
biotite/sequence/align/matrix_data/PAM220.mat +34 -0
biotite/sequence/align/matrix_data/PAM230.mat +34 -0
biotite/sequence/align/matrix_data/PAM240.mat +34 -0
biotite/sequence/align/matrix_data/PAM250.mat +34 -0
biotite/sequence/align/matrix_data/PAM260.mat +34 -0
biotite/sequence/align/matrix_data/PAM270.mat +34 -0
biotite/sequence/align/matrix_data/PAM280.mat +34 -0
biotite/sequence/align/matrix_data/PAM290.mat +34 -0
biotite/sequence/align/matrix_data/PAM30.mat +34 -0
biotite/sequence/align/matrix_data/PAM300.mat +34 -0
biotite/sequence/align/matrix_data/PAM310.mat +34 -0
biotite/sequence/align/matrix_data/PAM320.mat +34 -0
biotite/sequence/align/matrix_data/PAM330.mat +34 -0
biotite/sequence/align/matrix_data/PAM340.mat +34 -0
biotite/sequence/align/matrix_data/PAM350.mat +34 -0
biotite/sequence/align/matrix_data/PAM360.mat +34 -0
biotite/sequence/align/matrix_data/PAM370.mat +34 -0
biotite/sequence/align/matrix_data/PAM380.mat +34 -0
biotite/sequence/align/matrix_data/PAM390.mat +34 -0
biotite/sequence/align/matrix_data/PAM40.mat +34 -0
biotite/sequence/align/matrix_data/PAM400.mat +34 -0
biotite/sequence/align/matrix_data/PAM410.mat +34 -0
biotite/sequence/align/matrix_data/PAM420.mat +34 -0
biotite/sequence/align/matrix_data/PAM430.mat +34 -0
biotite/sequence/align/matrix_data/PAM440.mat +34 -0
biotite/sequence/align/matrix_data/PAM450.mat +34 -0
biotite/sequence/align/matrix_data/PAM460.mat +34 -0
biotite/sequence/align/matrix_data/PAM470.mat +34 -0
biotite/sequence/align/matrix_data/PAM480.mat +34 -0
biotite/sequence/align/matrix_data/PAM490.mat +34 -0
biotite/sequence/align/matrix_data/PAM50.mat +34 -0
biotite/sequence/align/matrix_data/PAM500.mat +34 -0
biotite/sequence/align/matrix_data/PAM60.mat +34 -0
biotite/sequence/align/matrix_data/PAM70.mat +34 -0
biotite/sequence/align/matrix_data/PAM80.mat +34 -0
biotite/sequence/align/matrix_data/PAM90.mat +34 -0
biotite/sequence/align/matrix_data/RBLOSUM52_5.0.mat +25 -0
biotite/sequence/align/matrix_data/RBLOSUM59_13p.mat +25 -0
biotite/sequence/align/matrix_data/RBLOSUM59_14.3.mat +25 -0
biotite/sequence/align/matrix_data/RBLOSUM64_5.0.mat +25 -0
biotite/sequence/align/matrix_data/RBLOSUM69_13p.mat +25 -0
biotite/sequence/align/matrix_data/RBLOSUM69_14.3.mat +25 -0
biotite/sequence/align/multiple.cpython-312-darwin.so +0 -0
biotite/sequence/align/multiple.pyx +620 -0
biotite/sequence/align/pairwise.cpython-312-darwin.so +0 -0
biotite/sequence/align/pairwise.pyx +587 -0
biotite/sequence/align/permutation.cpython-312-darwin.so +0 -0
biotite/sequence/align/permutation.pyx +305 -0
biotite/sequence/align/primes.txt +821 -0
biotite/sequence/align/selector.cpython-312-darwin.so +0 -0
biotite/sequence/align/selector.pyx +956 -0
biotite/sequence/align/statistics.py +265 -0
biotite/sequence/align/tracetable.cpython-312-darwin.so +0 -0
biotite/sequence/align/tracetable.pxd +64 -0
biotite/sequence/align/tracetable.pyx +370 -0
biotite/sequence/alphabet.py +566 -0
biotite/sequence/annotation.py +829 -0
biotite/sequence/codec.cpython-312-darwin.so +0 -0
biotite/sequence/codec.pyx +155 -0
biotite/sequence/codon.py +466 -0
biotite/sequence/codon_tables.txt +202 -0
biotite/sequence/graphics/__init__.py +33 -0
biotite/sequence/graphics/alignment.py +1034 -0
biotite/sequence/graphics/color_schemes/autumn.json +51 -0
biotite/sequence/graphics/color_schemes/blossom.json +51 -0
biotite/sequence/graphics/color_schemes/clustalx_dna.json +11 -0
biotite/sequence/graphics/color_schemes/clustalx_protein.json +28 -0
biotite/sequence/graphics/color_schemes/flower.json +51 -0
biotite/sequence/graphics/color_schemes/jalview_buried.json +31 -0
biotite/sequence/graphics/color_schemes/jalview_hydrophobicity.json +31 -0
biotite/sequence/graphics/color_schemes/jalview_prop_helix.json +31 -0
biotite/sequence/graphics/color_schemes/jalview_prop_strand.json +31 -0
biotite/sequence/graphics/color_schemes/jalview_prop_turn.json +31 -0
biotite/sequence/graphics/color_schemes/jalview_taylor.json +28 -0
biotite/sequence/graphics/color_schemes/jalview_zappo.json +28 -0
biotite/sequence/graphics/color_schemes/ocean.json +51 -0
biotite/sequence/graphics/color_schemes/pb_flower.json +39 -0
biotite/sequence/graphics/color_schemes/rainbow_dna.json +11 -0
biotite/sequence/graphics/color_schemes/rainbow_protein.json +30 -0
biotite/sequence/graphics/color_schemes/spring.json +51 -0
biotite/sequence/graphics/color_schemes/sunset.json +51 -0
biotite/sequence/graphics/color_schemes/wither.json +51 -0
biotite/sequence/graphics/colorschemes.py +139 -0
biotite/sequence/graphics/dendrogram.py +184 -0
biotite/sequence/graphics/features.py +510 -0
biotite/sequence/graphics/logo.py +110 -0
biotite/sequence/graphics/plasmid.py +661 -0
biotite/sequence/io/__init__.py +12 -0
biotite/sequence/io/fasta/__init__.py +22 -0
biotite/sequence/io/fasta/convert.py +273 -0
biotite/sequence/io/fasta/file.py +278 -0
biotite/sequence/io/fastq/__init__.py +19 -0
biotite/sequence/io/fastq/convert.py +120 -0
biotite/sequence/io/fastq/file.py +551 -0
biotite/sequence/io/genbank/__init__.py +17 -0
biotite/sequence/io/genbank/annotation.py +277 -0
biotite/sequence/io/genbank/file.py +575 -0
biotite/sequence/io/genbank/metadata.py +324 -0
biotite/sequence/io/genbank/sequence.py +172 -0
biotite/sequence/io/general.py +192 -0
biotite/sequence/io/gff/__init__.py +26 -0
biotite/sequence/io/gff/convert.py +133 -0
biotite/sequence/io/gff/file.py +434 -0
biotite/sequence/phylo/__init__.py +36 -0
biotite/sequence/phylo/nj.cpython-312-darwin.so +0 -0
biotite/sequence/phylo/nj.pyx +221 -0
biotite/sequence/phylo/tree.cpython-312-darwin.so +0 -0
biotite/sequence/phylo/tree.pyx +1169 -0
biotite/sequence/phylo/upgma.cpython-312-darwin.so +0 -0
biotite/sequence/phylo/upgma.pyx +164 -0
biotite/sequence/profile.py +456 -0
biotite/sequence/search.py +116 -0
biotite/sequence/seqtypes.py +556 -0
biotite/sequence/sequence.py +374 -0
biotite/structure/__init__.py +132 -0
biotite/structure/atoms.py +1455 -0
biotite/structure/basepairs.py +1415 -0
biotite/structure/bonds.cpython-312-darwin.so +0 -0
biotite/structure/bonds.pyx +1933 -0
biotite/structure/box.py +592 -0
biotite/structure/celllist.cpython-312-darwin.so +0 -0
biotite/structure/celllist.pyx +849 -0
biotite/structure/chains.py +298 -0
biotite/structure/charges.cpython-312-darwin.so +0 -0
biotite/structure/charges.pyx +520 -0
biotite/structure/compare.py +274 -0
biotite/structure/density.py +114 -0
biotite/structure/dotbracket.py +216 -0
biotite/structure/error.py +31 -0
biotite/structure/filter.py +585 -0
biotite/structure/geometry.py +697 -0
biotite/structure/graphics/__init__.py +13 -0
biotite/structure/graphics/atoms.py +226 -0
biotite/structure/graphics/rna.py +282 -0
biotite/structure/hbond.py +409 -0
biotite/structure/info/__init__.py +25 -0
biotite/structure/info/atom_masses.json +121 -0
biotite/structure/info/atoms.py +82 -0
biotite/structure/info/bonds.py +145 -0
biotite/structure/info/ccd/README.rst +8 -0
biotite/structure/info/ccd/amino_acids.txt +1663 -0
biotite/structure/info/ccd/carbohydrates.txt +1135 -0
biotite/structure/info/ccd/components.bcif +0 -0
biotite/structure/info/ccd/nucleotides.txt +798 -0
biotite/structure/info/ccd.py +95 -0
biotite/structure/info/groups.py +90 -0
biotite/structure/info/masses.py +123 -0
biotite/structure/info/misc.py +144 -0
biotite/structure/info/radii.py +197 -0
biotite/structure/info/standardize.py +196 -0
biotite/structure/integrity.py +268 -0
biotite/structure/io/__init__.py +30 -0
biotite/structure/io/ctab.py +72 -0
biotite/structure/io/dcd/__init__.py +13 -0
biotite/structure/io/dcd/file.py +65 -0
biotite/structure/io/general.py +257 -0
biotite/structure/io/gro/__init__.py +14 -0
biotite/structure/io/gro/file.py +343 -0
biotite/structure/io/mmtf/__init__.py +21 -0
biotite/structure/io/mmtf/assembly.py +214 -0
biotite/structure/io/mmtf/convertarray.cpython-312-darwin.so +0 -0
biotite/structure/io/mmtf/convertarray.pyx +341 -0
biotite/structure/io/mmtf/convertfile.cpython-312-darwin.so +0 -0
biotite/structure/io/mmtf/convertfile.pyx +501 -0
biotite/structure/io/mmtf/decode.cpython-312-darwin.so +0 -0
biotite/structure/io/mmtf/decode.pyx +152 -0
biotite/structure/io/mmtf/encode.cpython-312-darwin.so +0 -0
biotite/structure/io/mmtf/encode.pyx +183 -0
biotite/structure/io/mmtf/file.py +233 -0
biotite/structure/io/mol/__init__.py +20 -0
biotite/structure/io/mol/convert.py +115 -0
biotite/structure/io/mol/ctab.py +414 -0
biotite/structure/io/mol/header.py +116 -0
biotite/structure/io/mol/mol.py +193 -0
biotite/structure/io/mol/sdf.py +916 -0
biotite/structure/io/netcdf/__init__.py +13 -0
biotite/structure/io/netcdf/file.py +63 -0
biotite/structure/io/npz/__init__.py +20 -0
biotite/structure/io/npz/file.py +152 -0
biotite/structure/io/pdb/__init__.py +20 -0
biotite/structure/io/pdb/convert.py +293 -0
biotite/structure/io/pdb/file.py +1240 -0
biotite/structure/io/pdb/hybrid36.cpython-312-darwin.so +0 -0
biotite/structure/io/pdb/hybrid36.pyx +242 -0
biotite/structure/io/pdbqt/__init__.py +15 -0
biotite/structure/io/pdbqt/convert.py +107 -0
biotite/structure/io/pdbqt/file.py +640 -0
biotite/structure/io/pdbx/__init__.py +23 -0
biotite/structure/io/pdbx/bcif.py +648 -0
biotite/structure/io/pdbx/cif.py +1032 -0
biotite/structure/io/pdbx/component.py +246 -0
biotite/structure/io/pdbx/convert.py +1597 -0
biotite/structure/io/pdbx/encoding.cpython-312-darwin.so +0 -0
biotite/structure/io/pdbx/encoding.pyx +950 -0
biotite/structure/io/pdbx/legacy.py +267 -0
biotite/structure/io/tng/__init__.py +13 -0
biotite/structure/io/tng/file.py +46 -0
biotite/structure/io/trajfile.py +710 -0
biotite/structure/io/trr/__init__.py +13 -0
biotite/structure/io/trr/file.py +46 -0
biotite/structure/io/xtc/__init__.py +13 -0
biotite/structure/io/xtc/file.py +46 -0
biotite/structure/mechanics.py +75 -0
biotite/structure/molecules.py +353 -0
biotite/structure/pseudoknots.py +642 -0
biotite/structure/rdf.py +243 -0
biotite/structure/repair.py +253 -0
biotite/structure/residues.py +562 -0
biotite/structure/resutil.py +178 -0
biotite/structure/sasa.cpython-312-darwin.so +0 -0
biotite/structure/sasa.pyx +322 -0
biotite/structure/sequence.py +112 -0
biotite/structure/sse.py +327 -0
biotite/structure/superimpose.py +727 -0
biotite/structure/transform.py +504 -0
biotite/structure/util.py +98 -0
biotite/temp.py +86 -0
biotite/version.py +16 -0
biotite/visualize.py +251 -0
biotite-0.41.1.dist-info/METADATA +187 -0
biotite-0.41.1.dist-info/RECORD +340 -0
biotite-0.41.1.dist-info/WHEEL +4 -0
biotite-0.41.1.dist-info/licenses/LICENSE.rst +30 -0

biotite/structure/io/pdbqt/file.py ADDED Viewed

@@ -0,0 +1,640 @@
+# This source code is part of the Biotite package and is distributed
+# under the 3-Clause BSD License. Please see 'LICENSE.rst' for further
+# information.
+__name__ = "biotite.structure.io.pdbqt"
+__author__ = "Patrick Kunzmann, Daniel Bauer"
+__all__ = ["PDBQTFile"]
+import warnings
+import numpy as np
+from ....file import TextFile, InvalidFileError
+from ...error import BadStructureError
+from ...atoms import AtomArray, AtomArrayStack
+from ...charges import partial_charges
+from ...bonds import BondList, BondType, find_connected, find_rotatable_bonds
+# Element symbols treated as parametrized by this module.
+# NOTE(review): the code consuming this list is outside the visible part
+# of the file; presumably these are the elements for which AutoDock atom
+# types are available -- confirm against the atom type conversion code.
+PARAMETRIZED_ELEMENTS = [
+    "H", "C", "N", "O", "P", "S",
+    "F", "Cl", "Br", "I",
+    "Mg", "Ca", "Mn", "Fe", "Zn"
+]
+class PDBQTFile(TextFile):
+    """
+    This class represents an *AutoDock* PDBQT file.
+    This class only provides rudimentary support for reading/writing
+    the pure atom information.
+    EXPERIMENTAL: Future API changes are probable.
+    Examples
+    --------
+    Write biotin as flexible ligand into a PDBQT file:
+    >>> import os.path
+    >>> ligand = residue("BTN")
+    >>> file = PDBQTFile()
+    >>> mask = file.set_structure(ligand, rotatable_bonds="all")
+    >>> # Print removed nonpolar hydrogen atoms
+    >>> print(ligand[~mask])
+    HET         0  BTN H101   H         3.740    1.170    0.970
+    HET         0  BTN H102   H         4.070    1.340   -0.770
+    HET         0  BTN H91    H         2.800   -0.740   -1.210
+    HET         0  BTN H92    H         2.480   -0.910    0.530
+    HET         0  BTN H81    H         1.290    1.260    0.520
+    HET         0  BTN H82    H         1.620    1.440   -1.220
+    HET         0  BTN H71    H         0.350   -0.650   -1.660
+    HET         0  BTN H72    H         0.020   -0.820    0.080
+    HET         0  BTN H2     H        -0.840    1.580   -1.630
+    HET         0  BTN H61    H        -3.800    1.840    1.290
+    HET         0  BTN H62    H        -3.370    2.740   -0.200
+    HET         0  BTN H5     H        -4.310    0.810   -1.210
+    HET         0  BTN H4     H        -2.450   -0.040   -2.250
+    >>> print(file)
+    ROOT
+    HETATM    1 C11  BTN     0       5.090  -0.280   0.170  1.00  0.00     0.258 C
+    HETATM    2 O11  BTN     0       4.960  -1.470   0.030  1.00  0.00    -0.264 OA
+    ENDROOT
+    BRANCH   1   3
+    HETATM    3 O12  BTN     0       6.300   0.230   0.440  1.00  0.00    -0.331 OA
+    HETATM   17 HO2  BTN     0       7.030  -0.390   0.520  1.00  0.00     0.221 HD
+    ENDBRANCH   1   3
+    BRANCH   1   4
+    HETATM    4 C10  BTN     0       3.900   0.630   0.040  1.00  0.00     0.105 C
+    BRANCH   4   5
+    HETATM    5 C9   BTN     0       2.650  -0.200  -0.280  1.00  0.00     0.010 C
+    BRANCH   5   6
+    HETATM    6 C8   BTN     0       1.440   0.720  -0.410  1.00  0.00     0.002 C
+    BRANCH   6   7
+    HETATM    7 C7   BTN     0       0.200  -0.110  -0.730  1.00  0.00     0.016 C
+    BRANCH   7   8
+    HETATM    8 C2   BTN     0      -1.020   0.820  -0.860  1.00  0.00     0.065 C
+    HETATM    9 S1   BTN     0      -1.420   1.600   0.750  1.00  0.00    -0.154 SA
+    HETATM   10 C6   BTN     0      -3.200   1.830   0.370  1.00  0.00     0.090 C
+    HETATM   11 C5   BTN     0      -3.530   0.580  -0.480  1.00  0.00     0.091 C
+    HETATM   12 N1   BTN     0      -3.970  -0.510   0.410  1.00  0.00    -0.239 NA
+    HETATM   13 C3   BTN     0      -3.140  -1.550   0.270  1.00  0.00     0.272 C
+    HETATM   14 O3   BTN     0      -3.270  -2.590   0.890  1.00  0.00    -0.259 OA
+    HETATM   15 N2   BTN     0      -2.150  -1.340  -0.610  1.00  0.00    -0.239 NA
+    HETATM   16 C4   BTN     0      -2.290   0.010  -1.170  1.00  0.00     0.093 C
+    HETATM   18 HN1  BTN     0      -4.740  -0.470   1.000  1.00  0.00     0.132 HD
+    HETATM   19 HN2  BTN     0      -1.460  -1.980  -0.840  1.00  0.00     0.132 HD
+    ENDBRANCH   7   8
+    ENDBRANCH   6   7
+    ENDBRANCH   5   6
+    ENDBRANCH   4   5
+    ENDBRANCH   1   4
+    TORSDOF 6
+    >>> file.write(os.path.join(path_to_directory, "1l2y_mod.pdb"))
+    """
+    def get_remarks(self, model=None):
+        """
+        Get the content of ``REMARK`` lines.
+        Parameters
+        ----------
+        model : int, optional
+            If this parameter is given, the function will return a
+            string from the remarks corresponding to the given
+            model number (starting at 1).
+            Negative values are used to index models starting from the
+            last model instead of the first model.
+            If this parameter is omitted, a list of strings
+            containing all models will be returned, even if the
+            structure contains only one model.
+        Returns
+        -------
+        lines : str or list of str
+            The content of ``REMARK`` lines, without the leading
+            ``'REMARK '``.
+            Multiple remark lines of the same model are joined by
+            newline characters.
+        Raises
+        ------
+        ValueError
+            If `model` is 0 or refers to a model that does not exist
+            in the file.
+        """
+        # Line indices where a new model starts
+        model_start_i = np.array(
+            [i for i, line in enumerate(self.lines)
+             if line.startswith("MODEL")],
+            dtype=int
+        )
+        # Line indices with REMARK records
+        remark_line_i = np.array(
+            [i for i, line in enumerate(self.lines)
+             if line.startswith("REMARK")],
+            dtype=int
+        )
+        # Structures containing only one model may omit MODEL record
+        # In these cases model starting index is set to 0
+        if len(model_start_i) == 0:
+            model_start_i = np.array([0])
+        if model is None:
+            # Add exclusive end of file
+            model_start_i = np.concatenate((model_start_i, [len(self.lines)]))
+            remarks = []
+            for start, stop in zip(model_start_i[:-1], model_start_i[1:]):
+                model_remark_line_i = remark_line_i[
+                    (remark_line_i >= start) & (remark_line_i < stop)
+                ]
+                # 'REMARK ' spans 7 characters -> content begins at index 7
+                remarks.append(
+                    "\n".join(self.lines[i][7:] for i in model_remark_line_i)
+                )
+            return remarks
+        last_model = len(model_start_i)
+        if model == 0:
+            raise ValueError("The model index must not be 0")
+        requested_model = model
+        # Negative models mean index starting from last model
+        if model < 0:
+            model = last_model + model + 1
+        # Reject both too large positive and too small negative indices;
+        # without the lower bound a negative index would silently wrap
+        # around when indexing 'model_start_i'
+        if model < 1 or model > last_model:
+            raise ValueError(
+                f"The file has {last_model} models, "
+                f"the given model {requested_model} does not exist"
+            )
+        line_filter = remark_line_i >= model_start_i[model-1]
+        if model < last_model:
+            # The model ends where the next model starts
+            line_filter &= remark_line_i < model_start_i[model]
+        remark_line_i = remark_line_i[line_filter]
+        # 'REMARK ' spans 7 characters -> content begins at index 7
+        return "\n".join(self.lines[i][7:] for i in remark_line_i)
+    def get_structure(self, model=None):
+        """
+        Get an :class:`AtomArray` or :class:`AtomArrayStack` from the
+        PDBQT file.
+        Parameters
+        ----------
+        model : int, optional
+            If this parameter is given, the function will return an
+            :class:`AtomArray` from the atoms corresponding to the given
+            model number (starting at 1).
+            Negative values are used to index models starting from the
+            last model instead of the first model.
+            If this parameter is omitted, an :class:`AtomArrayStack`
+            containing all models will be returned, even if the
+            structure contains only one model.
+        Returns
+        -------
+        array : AtomArray or AtomArrayStack
+            The return type depends on the `model` parameter.
+            The atoms are ordered by the atom IDs given in the file.
+        Raises
+        ------
+        ValueError
+            If `model` is 0 or refers to a model that does not exist
+            in the file.
+        """
+        # Line indices where a new model starts
+        model_start_i = np.array(
+            [i for i, line in enumerate(self.lines)
+             if line.startswith("MODEL")],
+            dtype=int
+        )
+        # Line indices with ATOM or HETATM records
+        atom_line_i = np.array(
+            [i for i, line in enumerate(self.lines)
+             if line.startswith(("ATOM", "HETATM"))],
+            dtype=int
+        )
+        # Structures containing only one model may omit MODEL record
+        # In these cases model starting index is set to 0
+        if len(model_start_i) == 0:
+            model_start_i = np.array([0])
+        if model is None:
+            depth = len(model_start_i)
+            length = self._get_model_length(model_start_i, atom_line_i)
+            array = AtomArrayStack(depth, length)
+            # Line indices for annotation determination
+            # Annotation is determined from model 1,
+            # therefore from ATOM records before second MODEL record
+            if len(model_start_i) == 1:
+                annot_i = atom_line_i
+            else:
+                annot_i = atom_line_i[atom_line_i < model_start_i[1]]
+            # Line indices for coordinate determination
+            coord_i = atom_line_i
+        else:
+            last_model = len(model_start_i)
+            if model == 0:
+                raise ValueError("The model index must not be 0")
+            requested_model = model
+            # Negative models mean index starting from last model
+            if model < 0:
+                model = last_model + model + 1
+            # Reject both too large positive and too small negative
+            # indices; without the lower bound a negative index would
+            # silently wrap around when indexing 'model_start_i'
+            if model < 1 or model > last_model:
+                raise ValueError(
+                    f"The file has {last_model} models, "
+                    f"the given model {requested_model} does not exist"
+                )
+            line_filter = atom_line_i >= model_start_i[model-1]
+            if model < last_model:
+                # The model ends where the next model starts
+                line_filter &= atom_line_i < model_start_i[model]
+            annot_i = coord_i = atom_line_i[line_filter]
+            array = AtomArray(len(coord_i))
+        # Save atom IDs for later sorting into the original atom order
+        atom_id  = np.zeros(array.array_length(), int)
+        # Create annotation arrays
+        chain_id  = np.zeros(array.array_length(), array.chain_id.dtype)
+        res_id    = np.zeros(array.array_length(), array.res_id.dtype)
+        ins_code  = np.zeros(array.array_length(), array.ins_code.dtype)
+        res_name  = np.zeros(array.array_length(), array.res_name.dtype)
+        hetero    = np.zeros(array.array_length(), array.hetero.dtype)
+        atom_name = np.zeros(array.array_length(), array.atom_name.dtype)
+        element   = np.zeros(array.array_length(), array.element.dtype)
+        # Fill annotation array
+        # i is index in array, line_i is line index
+        for i, line_i in enumerate(annot_i):
+            line = self.lines[line_i]
+            atom_id[i] = int(line[6:11])
+            chain_id[i] = line[21].strip()
+            res_id[i] = int(line[22:26])
+            ins_code[i] = line[26].strip()
+            res_name[i] = line[17:20].strip()
+            # Every record that is not 'ATOM' is a 'HETATM' record
+            hetero[i] = line[0:4] != "ATOM"
+            atom_name[i] = line[12:16].strip()
+            element[i] = line[76:78].strip()
+        # Add annotation arrays to atom array (stack)
+        array.chain_id = chain_id
+        array.res_id = res_id
+        array.ins_code = ins_code
+        array.res_name = res_name
+        array.hetero = hetero
+        array.atom_name = atom_name
+        array.element = element
+        # Fill in coordinates
+        if isinstance(array, AtomArray):
+            for i, line_i in enumerate(coord_i):
+                line = self.lines[line_i]
+                array.coord[i,0] = float(line[30:38])
+                array.coord[i,1] = float(line[38:46])
+                array.coord[i,2] = float(line[46:54])
+        elif isinstance(array, AtomArrayStack):
+            # m is the model index, i is the atom index within the model
+            m = 0
+            i = 0
+            for line_i in coord_i:
+                # Passing the start line of the next model means that
+                # the atom belongs to the next model
+                if m < len(model_start_i)-1 and line_i > model_start_i[m+1]:
+                    m += 1
+                    i = 0
+                line = self.lines[line_i]
+                array.coord[m,i,0] = float(line[30:38])
+                array.coord[m,i,1] = float(line[38:46])
+                array.coord[m,i,2] = float(line[46:54])
+                i += 1
+        # Sort into the original atom order
+        array = array[..., np.argsort(atom_id)]
+        return array
+    def set_structure(self, atoms, charges=None, atom_types=None,
+                      rotatable_bonds=None, root=None, include_torsdof=True):
+        """
+        Write an :class:`AtomArray` into the PDBQT file.
+        Parameters
+        ----------
+        atoms : AtomArray, shape=(n,)
+            The atoms to be written into this file.
+            Must have an associated :class:`BondList`.
+        charges : ndarray, shape=(n,), dtype=float, optional
+            Partial charges for each atom in `atoms`.
+            By default, the charges are calculated using the PEOE method
+            (:func:`partial_charges()`).
+        atom_types : ndarray, shape=(n,), dtype="U1", optional
+            Custom *AutoDock* atom types for each atom in `atoms`.
+        rotatable_bonds : None or 'rigid' or 'all' or BondList, optional
+            This parameter describes, how rotatable bonds are handled,
+            with respect to ``ROOT``, ``BRANCH`` and ``ENDBRANCH``
+            lines.
+                - ``None`` - The molecule is handled as rigid receptor:
+                  No ``ROOT``, ``BRANCH`` and ``ENDBRANCH`` lines will
+                  be written.
+                - ``'rigid'`` - The molecule is handled as rigid ligand:
+                  Only a ``ROOT`` line will be written.
+                - ``'all'`` - The molecule is handled as flexible
+                  ligand:
+                  A ``ROOT`` line will be written and all rotatable
+                  bonds are included using ``BRANCH`` and ``ENDBRANCH``
+                  lines.
+                - :class:`BondList` - The molecule is handled as
+                  flexible ligand:
+                  A ``ROOT`` line will be written and all bonds in the
+                  given :class:`BondList` are considered flexible via
+                  ``BRANCH`` and ``ENDBRANCH`` lines.
+        root : int, optional
+            Specifies the index of the atom following the ``ROOT`` line.
+            Setting the root atom is useful for specifying the *anchor*
+            in flexible side chains.
+            This parameter has no effect, if `rotatable_bonds` is
+            ``None``.
+            By default, the first atom is also the root atom.
+        include_torsdof : bool, optional
+            By default, a ``TORSDOF`` (torsional degrees of freedom)
+            record is written at the end of the file.
+            By setting this parameter to false, the record is omitted.
+        Returns
+        -------
+        mask : ndarray, shape=(n,), dtype=bool
+            A boolean mask, that is ``False`` for each atom of the input
+            ``atoms``, that was removed due to being a nonpolar
+            hydrogen.
+        """
+        # Check if AtomArray is suitable for PDBQT
+        max_atoms, max_residues = 99999, 9999
+        if atoms.array_length() > max_atoms:
+            warnings.warn(f"More then {max_atoms:,} atoms per model")
+        if (atoms.res_id > max_residues).any():
+            warnings.warn(f"Residue IDs exceed {max_residues:,}")
+        if np.isnan(atoms.coord).any():
+            raise BadStructureError("Coordinates contain 'NaN' values")
+        if any([len(name) > 1 for name in atoms.chain_id]):
+            raise BadStructureError("Some chain IDs exceed 1 character")
+        if any([len(name) > 3 for name in atoms.res_name]):
+            raise BadStructureError("Some residue names exceed 3 characters")
+        if any([len(name) > 4 for name in atoms.atom_name]):
+            raise BadStructureError("Some atom names exceed 4 characters")
+        if charges is None:
+            charges = partial_charges(atoms)
+            charges[np.isnan(charges)] = 0
+        else:
+            if np.isnan(charges).any():
+                raise ValueError("Input charges contain NaN values")
+        # Get AutoDock atom types and remove nonpolar hydrogen atoms
+        atoms, charges, types, mask = convert_atoms(atoms, charges)
+        # Overwrite calculated atom types with input atom types
+        if atom_types is not None:
+            types = atom_types[mask]
+        if rotatable_bonds is None:
+            # No rotatable bonds -> the BondList contains no bonds
+            rotatable_bonds = BondList(atoms.bonds.get_atom_count())
+            use_root = False
+        elif rotatable_bonds == "rigid":
+            rotatable_bonds = BondList(atoms.bonds.get_atom_count())
+            use_root = True
+        elif rotatable_bonds == "all":
+            rotatable_bonds = find_rotatable_bonds(atoms.bonds)
+            use_root = True
+        else:
+            if rotatable_bonds.ndim != 2 or rotatable_bonds.shape[1] != 2:
+                raise ValueError(
+                    "An (nx2) array is expected for rotatable bonds"
+                )
+            rotatable_bonds = BondList(
+                len(mask), np.asarray(rotatable_bonds)
+            )[mask]
+            use_root = True
+        if root is None:
+            root_index = 0
+        else:
+            # Find new index of root atom, since the index might have
+            # been shifted due to removed atoms
+            original_indices = np.arange(len(mask))
+            new_indices = original_indices[mask]
+            try:
+                root_index = np.where(new_indices == root)[0][0]
+            except IndexError:
+                raise ValueError(
+                    "The given root atom index points to an nonpolar hydrogen "
+                    "atom, that has been removed"
+                )
+            # Add bonds of the rigid root to rotatable bonds,
+            # as they probably have been filtered out,
+            # as the root is probably a terminal atom
+            for atom, bond_type in zip(*atoms.bonds.get_bonds(root_index)):
+                rotatable_bonds.add_bond(root_index, atom, bond_type)
+        # Break rotatable bonds
+        # for simple branch determination in '_write_atoms()'
+        atoms.bonds.remove_bonds(rotatable_bonds)
+        hetero = ["ATOM" if e == False else "HETATM" for e in atoms.hetero]
+        if "atom_id" in atoms.get_annotation_categories():
+            atom_id = atoms.atom_id
+        else:
+            atom_id = np.arange(1, atoms.array_length()+1)
+        occupancy = np.ones(atoms.array_length())
+        b_factor = np.zeros(atoms.array_length())
+        # Convert rotatable bonds into array for easier handling
+        # The bond type is irrelevant from this point on
+        rotatable_bonds = rotatable_bonds.as_array()[:,:2]
+        self.lines = []
+        self._write_atoms(
+            atoms, charges, types,
+            atom_id, hetero, occupancy, b_factor,
+            root_index, rotatable_bonds,
+            np.zeros(len(rotatable_bonds), dtype=bool), use_root
+        )
+        if include_torsdof:
+            self.lines.append(f"TORSDOF {len(rotatable_bonds)}")
+        return mask
+    def _write_atoms(self, atoms, charges, types,
+                     atom_id, hetero, occupancy, b_factor,
+                     root_atom, rotatable_bonds, visited_rotatable_bonds,
+                     is_root):
+        if len(rotatable_bonds) != 0:
+            # Get the indices to atoms of this branch, i.e. a group of
+            # atoms that are connected by non-rotatable bonds
+            # Use 'find_connected()', since rotatable bonds were removed
+            # from the BondList before
+            this_branch_indices = find_connected(atoms.bonds, root_atom)
+            # The root atom of the branch, i.e. the atom connected by
+            # the rotatable bond should always be listed first
+            # -> Remove root atom and insert it at the beginning
+            this_branch_indices = np.insert(
+                this_branch_indices[this_branch_indices != root_atom],
+                0,
+                root_atom
+            )
+        else:
+            # No rotatable bonds
+            # -> all atom are in root i.e. this branch
+            this_branch_indices = np.arange(atoms.array_length())
+        if is_root:
+            self.lines.append("ROOT")
+        for i in this_branch_indices:
+            self.lines.append(
+                f"{hetero[i]:6}"
+                f"{atom_id[i]:>5d} "
+                f"{atoms.atom_name[i]:4} "
+                f"{atoms.res_name[i]:3} "
+                f"{atoms.chain_id[i]:1}"
+                f"{atoms.res_id[i]:>4d}"
+                f"{atoms.ins_code[i]:1}   "
+                f"{atoms.coord[i,0]:>8.3f}"
+                f"{atoms.coord[i,1]:>8.3f}"
+                f"{atoms.coord[i,2]:>8.3f}"
+                f"{occupancy[i]:>6.2f}"
+                f"{b_factor[i]:>6.2f}    "
+                f"{charges[i]:>6.3f} "
+                f"{types[i]:2}"
+            )
+        if is_root:
+            self.lines.append("ENDROOT")
+        if len(rotatable_bonds) == 0:
+            # No rotatable bonds -> no branching
+            return
+        for k, (i, j) in enumerate(rotatable_bonds):
+            if visited_rotatable_bonds[k]:
+                continue
+            # Create a new branch for each rotatable bond,
+            # that connects to an atom of this branch
+            if i in this_branch_indices:
+                this_br_i = i
+                new_br_i = j
+            elif j in this_branch_indices:
+                this_br_i = j
+                new_br_i = i
+            else:
+                # Rotatable bond does not start from this branch
+                continue
+            # Mark rotatable bond as visited as otherwise branches would
+            # be created back and forth over the same rotatable bond and
+            # this method would never terminate
+            visited_rotatable_bonds[k] = True
+            self.lines.append(
+                f"BRANCH {atom_id[this_br_i]:>3d} {atom_id[new_br_i]:>3d}"
+            )
+            self._write_atoms(
+                atoms, charges, types,
+                atom_id, hetero, occupancy, b_factor,
+                # The root atom of the branch
+                #is the other atom of the rotatable bond
+                new_br_i, rotatable_bonds, visited_rotatable_bonds,
+                False
+            )
+            self.lines.append(
+                f"ENDBRANCH {atom_id[this_br_i]:>3d} {atom_id[new_br_i]:>3d}"
+            )
+    def _get_model_length(self, model_start_i, atom_line_i):
+        """
+        Determine length of models and check that all models
+        have equal length.
+        """
+        n_models = len(model_start_i)
+        length = None
+        for model_i in range(len(model_start_i)):
+            model_start = model_start_i[model_i]
+            model_stop = model_start_i[model_i+1] if model_i+1 < n_models \
+                            else len(self.lines)
+            model_length = np.count_nonzero(
+                (atom_line_i >= model_start) & (atom_line_i < model_stop)
+            )
+            if length is None:
+                length = model_length
+            if model_length != length:
+                raise InvalidFileError(
+                    f"Model {model_i+1} has {model_length} atoms, "
+                    f"but model 1 has {length} atoms, must be equal"
+                )
+        return length
+def convert_atoms(atoms, charges):
+    """
+    Convert atoms into *AutoDock* compatible atoms.
+    Parameters
+    ----------
+    atoms : AtomArray
+        The atoms to be converted.
+    charges : ndarray, dtype=float
+        Partial charges for the atoms.
+    Returns
+    -------
+    converted_atoms : AtomArray
+        The input `atoms`, but with deleted nonpolar hydrogen atoms.
+    charges : ndarray, dtype=float
+        The input `charges`, but with deleted entries for nonpolar
+        hydrogen atoms.
+    atom_types : ndarray, dtype="U1"
+        The *AutoDock* atom types.
+    mask : ndarray, shape=(n,), dtype=bool
+        A boolean mask, that is ``False`` for each atom of the input
+        ``atoms``, that was removed due to being a nonpolar hydrogen.
+    """
+    charges = charges.copy()
+    all_bonds, all_bond_types = atoms.bonds.get_all_bonds()
+    atom_types = np.zeros(atoms.array_length(), dtype="U2")
+    hydrogen_removal_mask = np.zeros(atoms.array_length(), dtype=bool)
+    for i in range(atoms.array_length()):
+        element = atoms.element[i]
+        bonded_atoms = all_bonds[i][all_bonds[i] != -1]
+        if element == "H":
+            if len(bonded_atoms) == 0:
+                # Free proton
+                atom_types[i] = "H"
+            elif len(bonded_atoms) == 1:
+                j = bonded_atoms[0]
+                bonded_element = atoms.element[j]
+                if bonded_element == "C":
+                    # Remove hydrogen and add its charge
+                    # to charge of bonded carbon
+                    charges[j] += charges[i]
+                    hydrogen_removal_mask[i] = True
+                else:
+                    atom_types[i] = "HD"
+            else:
+                raise BadStructureError(
+                    "Structure contains hydrogen with multiple bonds"
+                )
+        elif element == "C":
+            if np.isin(
+                all_bond_types[i],
+                [BondType.AROMATIC_SINGLE, BondType.AROMATIC_DOUBLE]
+            ).any():
+                # Aromatic carbon
+                atom_types[i] = "A"
+            else:
+                # Alphatic carbon
+                atom_types[i] = "C"
+        elif element == "N":
+            atom_types[i] = "NA"
+        elif element == "O":
+            atom_types[i] = "OA"
+        elif element == "S":
+            atom_types[i] = "SA"
+        elif element.capitalize() in PARAMETRIZED_ELEMENTS:
+            atom_types[i] = element.capitalize()
+        else:
+            warnings.warn(
+                f"Element {element} is not paramtrized, "
+                f"using parameters for hydrogen instead"
+            )
+            atom_types[i] = "H"
+    mask = ~hydrogen_removal_mask
+    return atoms[mask], charges[mask], atom_types[mask], mask

biotite/structure/io/pdbx/__init__.py ADDED Viewed

@@ -0,0 +1,23 @@
+# This source code is part of the Biotite package and is distributed
+# under the 3-Clause BSD License. Please see 'LICENSE.rst' for further
+# information.
+"""
+This subpackage provides support for the modern PDBx file formats.
+The :class:`CIFFile` class provides dictionary-like access to
+every field in text-based *mmCIF* files.
+:class:`BinaryCIFFile` provides analogous functionality for the
+*BinaryCIF* format.
+Additional utility functions allow reading and writing structures
+from/to these files.
+"""
+__name__ = "biotite.structure.io.pdbx"
+__author__ = "Patrick Kunzmann"
+from .convert import *
+from .bcif import *
+from .cif import *
+from .component import *
+from .encoding import *
+from .legacy import *