PyPI - biotite - Versions diffs - 0.41.1__cp312-cp312-win_amd64.whl → 1.0.0__cp312-cp312-win_amd64.whl - Mend

biotite 0.41.1__cp312-cp312-win_amd64.whl → 1.0.0__cp312-cp312-win_amd64.whl

This diff compares the contents of two publicly available package versions as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.

Potentially problematic release.

This version of biotite might be problematic. Click here for more details.

Files changed (205)

biotite/__init__.py +2 -3
biotite/application/__init__.py +36 -10
biotite/application/application.py +22 -11
biotite/application/autodock/__init__.py +1 -1
biotite/application/autodock/app.py +74 -79
biotite/application/blast/__init__.py +1 -1
biotite/application/blast/alignment.py +19 -10
biotite/application/blast/webapp.py +92 -85
biotite/application/clustalo/__init__.py +1 -1
biotite/application/clustalo/app.py +46 -61
biotite/application/dssp/__init__.py +1 -1
biotite/application/dssp/app.py +8 -11
biotite/application/localapp.py +62 -60
biotite/application/mafft/__init__.py +1 -1
biotite/application/mafft/app.py +16 -22
biotite/application/msaapp.py +78 -89
biotite/application/muscle/__init__.py +1 -1
biotite/application/muscle/app3.py +50 -64
biotite/application/muscle/app5.py +23 -31
biotite/application/sra/__init__.py +1 -1
biotite/application/sra/app.py +64 -68
biotite/application/tantan/__init__.py +1 -1
biotite/application/tantan/app.py +22 -45
biotite/application/util.py +7 -9
biotite/application/viennarna/rnaalifold.py +34 -28
biotite/application/viennarna/rnafold.py +24 -39
biotite/application/viennarna/rnaplot.py +36 -21
biotite/application/viennarna/util.py +17 -12
biotite/application/webapp.py +13 -14
biotite/copyable.py +13 -13
biotite/database/__init__.py +1 -1
biotite/database/entrez/__init__.py +1 -1
biotite/database/entrez/check.py +2 -3
biotite/database/entrez/dbnames.py +7 -5
biotite/database/entrez/download.py +55 -49
biotite/database/entrez/key.py +1 -1
biotite/database/entrez/query.py +62 -23
biotite/database/error.py +2 -1
biotite/database/pubchem/__init__.py +1 -1
biotite/database/pubchem/download.py +43 -45
biotite/database/pubchem/error.py +2 -2
biotite/database/pubchem/query.py +34 -31
biotite/database/pubchem/throttle.py +3 -4
biotite/database/rcsb/__init__.py +1 -1
biotite/database/rcsb/download.py +44 -52
biotite/database/rcsb/query.py +85 -80
biotite/database/uniprot/check.py +6 -3
biotite/database/uniprot/download.py +6 -11
biotite/database/uniprot/query.py +115 -31
biotite/file.py +12 -31
biotite/sequence/__init__.py +16 -5
biotite/sequence/align/__init__.py +160 -6
biotite/sequence/align/alignment.py +99 -90
biotite/sequence/align/banded.cp312-win_amd64.pyd +0 -0
biotite/sequence/align/buckets.py +12 -10
biotite/sequence/align/cigar.py +43 -52
biotite/sequence/align/kmeralphabet.cp312-win_amd64.pyd +0 -0
biotite/sequence/align/kmeralphabet.pyx +55 -51
biotite/sequence/align/kmersimilarity.cp312-win_amd64.pyd +0 -0
biotite/sequence/align/kmertable.cp312-win_amd64.pyd +0 -0
biotite/sequence/align/kmertable.pyx +3 -2
biotite/sequence/align/localgapped.cp312-win_amd64.pyd +0 -0
biotite/sequence/align/localungapped.cp312-win_amd64.pyd +0 -0
biotite/sequence/align/matrix.py +81 -82
biotite/sequence/align/multiple.cp312-win_amd64.pyd +0 -0
biotite/sequence/align/multiple.pyx +35 -35
biotite/sequence/align/pairwise.cp312-win_amd64.pyd +0 -0
biotite/sequence/align/permutation.cp312-win_amd64.pyd +0 -0
biotite/sequence/align/permutation.pyx +12 -4
biotite/sequence/align/selector.cp312-win_amd64.pyd +0 -0
biotite/sequence/align/selector.pyx +52 -54
biotite/sequence/align/statistics.py +32 -33
biotite/sequence/align/tracetable.cp312-win_amd64.pyd +0 -0
biotite/sequence/alphabet.py +112 -126
biotite/sequence/annotation.py +78 -77
biotite/sequence/codec.cp312-win_amd64.pyd +0 -0
biotite/sequence/codon.py +90 -79
biotite/sequence/graphics/__init__.py +1 -1
biotite/sequence/graphics/alignment.py +184 -103
biotite/sequence/graphics/colorschemes.py +10 -12
biotite/sequence/graphics/dendrogram.py +79 -34
biotite/sequence/graphics/features.py +133 -99
biotite/sequence/graphics/logo.py +22 -28
biotite/sequence/graphics/plasmid.py +229 -178
biotite/sequence/io/fasta/__init__.py +1 -1
biotite/sequence/io/fasta/convert.py +44 -33
biotite/sequence/io/fasta/file.py +42 -55
biotite/sequence/io/fastq/__init__.py +1 -1
biotite/sequence/io/fastq/convert.py +11 -14
biotite/sequence/io/fastq/file.py +68 -112
biotite/sequence/io/genbank/__init__.py +2 -2
biotite/sequence/io/genbank/annotation.py +12 -20
biotite/sequence/io/genbank/file.py +74 -76
biotite/sequence/io/genbank/metadata.py +74 -62
biotite/sequence/io/genbank/sequence.py +13 -14
biotite/sequence/io/general.py +39 -30
biotite/sequence/io/gff/__init__.py +2 -2
biotite/sequence/io/gff/convert.py +10 -15
biotite/sequence/io/gff/file.py +81 -65
biotite/sequence/phylo/__init__.py +1 -1
biotite/sequence/phylo/nj.cp312-win_amd64.pyd +0 -0
biotite/sequence/phylo/tree.cp312-win_amd64.pyd +0 -0
biotite/sequence/phylo/upgma.cp312-win_amd64.pyd +0 -0
biotite/sequence/profile.py +57 -28
biotite/sequence/search.py +17 -15
biotite/sequence/seqtypes.py +200 -164
biotite/sequence/sequence.py +64 -64
biotite/structure/__init__.py +3 -3
biotite/structure/atoms.py +226 -240
biotite/structure/basepairs.py +260 -271
biotite/structure/bonds.cp312-win_amd64.pyd +0 -0
biotite/structure/bonds.pyx +88 -100
biotite/structure/box.py +67 -71
biotite/structure/celllist.cp312-win_amd64.pyd +0 -0
biotite/structure/chains.py +55 -39
biotite/structure/charges.cp312-win_amd64.pyd +0 -0
biotite/structure/compare.py +32 -32
biotite/structure/density.py +13 -18
biotite/structure/dotbracket.py +20 -22
biotite/structure/error.py +10 -2
biotite/structure/filter.py +82 -77
biotite/structure/geometry.py +130 -119
biotite/structure/graphics/atoms.py +60 -43
biotite/structure/graphics/rna.py +81 -68
biotite/structure/hbond.py +112 -93
biotite/structure/info/__init__.py +0 -2
biotite/structure/info/atoms.py +10 -11
biotite/structure/info/bonds.py +41 -43
biotite/structure/info/ccd.py +21 -7
biotite/structure/info/groups.py +10 -15
biotite/structure/info/masses.py +5 -10
biotite/structure/info/misc.py +1 -1
biotite/structure/info/radii.py +20 -20
biotite/structure/info/standardize.py +15 -26
biotite/structure/integrity.py +18 -71
biotite/structure/io/__init__.py +3 -4
biotite/structure/io/dcd/__init__.py +1 -1
biotite/structure/io/dcd/file.py +22 -20
biotite/structure/io/general.py +47 -61
biotite/structure/io/gro/__init__.py +1 -1
biotite/structure/io/gro/file.py +73 -72
biotite/structure/io/mol/__init__.py +1 -1
biotite/structure/io/mol/convert.py +8 -11
biotite/structure/io/mol/ctab.py +37 -36
biotite/structure/io/mol/header.py +14 -10
biotite/structure/io/mol/mol.py +9 -53
biotite/structure/io/mol/sdf.py +47 -50
biotite/structure/io/netcdf/__init__.py +1 -1
biotite/structure/io/netcdf/file.py +24 -23
biotite/structure/io/pdb/__init__.py +1 -1
biotite/structure/io/pdb/convert.py +32 -20
biotite/structure/io/pdb/file.py +151 -172
biotite/structure/io/pdb/hybrid36.cp312-win_amd64.pyd +0 -0
biotite/structure/io/pdbqt/__init__.py +1 -1
biotite/structure/io/pdbqt/convert.py +17 -11
biotite/structure/io/pdbqt/file.py +128 -80
biotite/structure/io/pdbx/__init__.py +1 -2
biotite/structure/io/pdbx/bcif.py +36 -52
biotite/structure/io/pdbx/cif.py +64 -62
biotite/structure/io/pdbx/component.py +10 -16
biotite/structure/io/pdbx/convert.py +235 -246
biotite/structure/io/pdbx/encoding.cp312-win_amd64.pyd +0 -0
biotite/structure/io/trajfile.py +76 -93
biotite/structure/io/trr/__init__.py +1 -1
biotite/structure/io/trr/file.py +12 -15
biotite/structure/io/xtc/__init__.py +1 -1
biotite/structure/io/xtc/file.py +11 -14
biotite/structure/mechanics.py +9 -11
biotite/structure/molecules.py +3 -4
biotite/structure/pseudoknots.py +53 -67
biotite/structure/rdf.py +23 -21
biotite/structure/repair.py +137 -86
biotite/structure/residues.py +26 -16
biotite/structure/sasa.cp312-win_amd64.pyd +0 -0
biotite/structure/{resutil.py → segments.py} +24 -23
biotite/structure/sequence.py +10 -11
biotite/structure/sse.py +100 -119
biotite/structure/superimpose.py +39 -77
biotite/structure/transform.py +97 -71
biotite/structure/util.py +11 -13
biotite/version.py +2 -2
biotite/visualize.py +69 -55
{biotite-0.41.1.dist-info → biotite-1.0.0.dist-info}/METADATA +6 -6
biotite-1.0.0.dist-info/RECORD +322 -0
{biotite-0.41.1.dist-info → biotite-1.0.0.dist-info}/WHEEL +1 -1
biotite/structure/io/ctab.py +0 -72
biotite/structure/io/mmtf/__init__.py +0 -21
biotite/structure/io/mmtf/assembly.py +0 -214
biotite/structure/io/mmtf/convertarray.cp312-win_amd64.pyd +0 -0
biotite/structure/io/mmtf/convertarray.pyx +0 -341
biotite/structure/io/mmtf/convertfile.cp312-win_amd64.pyd +0 -0
biotite/structure/io/mmtf/convertfile.pyx +0 -501
biotite/structure/io/mmtf/decode.cp312-win_amd64.pyd +0 -0
biotite/structure/io/mmtf/decode.pyx +0 -152
biotite/structure/io/mmtf/encode.cp312-win_amd64.pyd +0 -0
biotite/structure/io/mmtf/encode.pyx +0 -183
biotite/structure/io/mmtf/file.py +0 -233
biotite/structure/io/npz/__init__.py +0 -20
biotite/structure/io/npz/file.py +0 -152
biotite/structure/io/pdbx/legacy.py +0 -267
biotite/structure/io/tng/__init__.py +0 -13
biotite/structure/io/tng/file.py +0 -46
biotite/temp.py +0 -86
biotite-0.41.1.dist-info/RECORD +0 -340
{biotite-0.41.1.dist-info → biotite-1.0.0.dist-info}/licenses/LICENSE.rst +0 -0

biotite/sequence/io/fastq/file.py CHANGED Viewed

@@ -5,23 +5,21 @@
 __name__ = "biotite.sequence.io.fastq"
 __author__ = "Patrick Kunzmann"
-import warnings
-from numbers import Integral
 from collections import OrderedDict
 from collections.abc import MutableMapping
+from numbers import Integral
 import numpy as np
-from ....file import TextFile, InvalidFileError, wrap_string
-from ...seqtypes import NucleotideSequence
+from biotite.file import InvalidFileError, TextFile, wrap_string
 __all__ = ["FastqFile"]
 _OFFSETS = {
-    "Sanger"       : 33,
-    "Solexa"       : 64,
-    "Illumina-1.3" : 64,
-    "Illumina-1.5" : 64,
-    "Illumina-1.8" : 33,
+    "Sanger": 33,
+    "Solexa": 64,
+    "Illumina-1.3": 64,
+    "Illumina-1.5": 64,
+    "Illumina-1.8": 33,
 }
@@ -47,7 +45,7 @@ class FastqFile(TextFile, MutableMapping):
     An identifier string (without the leading ``@``) is used as index
     to get and set the corresponding sequence and quality.
     ``del`` removes an entry in the file.
     Parameters
     ----------
     offset : int or {'Sanger', 'Solexa', 'Illumina-1.3', 'Illumina-1.5', 'Illumina-1.8'}
@@ -61,10 +59,10 @@ class FastqFile(TextFile, MutableMapping):
         Only relevant, when adding sequences to a file.
         By default each sequence (and score string)
         is put into one line.
     Examples
     --------
     >>> import os.path
     >>> file = FastqFile(offset="Sanger")
     >>> file["seq1"] = str(NucleotideSequence("ATACT")), [0,3,10,7,12]
@@ -91,18 +89,18 @@ class FastqFile(TextFile, MutableMapping):
     0.96=GD
     >>> file.write(os.path.join(path_to_directory, "test.fastq"))
     """
     def __init__(self, offset, chars_per_line=None):
         super().__init__()
         self._chars_per_line = chars_per_line
         self._entries = OrderedDict()
         self._offset = _convert_offset(offset)
     @classmethod
     def read(cls, file, offset, chars_per_line=None):
         """
         Read a FASTQ file.
         Parameters
         ----------
         file : file-like object or str
@@ -119,7 +117,7 @@ class FastqFile(TextFile, MutableMapping):
             Only relevant, when adding sequences to a file.
             By default each sequence (and score string)
             is put into one line.
         Returns
         -------
         file_object : FastqFile
@@ -134,31 +132,7 @@ class FastqFile(TextFile, MutableMapping):
             raise InvalidFileError("File is empty")
         file._find_entries()
         return file
-    def get_sequence(self, identifier):
-        """
-        Get the sequence for the specified identifier.
-        DEPRECATED: Use :meth:`get_seq_string()` or
-        :func:`get_sequence()` instead.
-        Parameters
-        ----------
-        identifier : str
-            The identifier of the sequence.
-        Returns
-        -------
-        sequence : NucleotideSequence
-            The sequence corresponding to the identifier.
-        """
-        warnings.warn(
-            "'get_sequence()' is deprecated, use the 'get_seq_string()'"
-            "method or 'fasta.get_sequence()' function instead",
-            DeprecationWarning
-        )
-        return NucleotideSequence(self.get_seq_string(identifier))
     def get_seq_string(self, identifier):
         """
         Get the string representing the sequence for the specified
@@ -168,22 +142,19 @@ class FastqFile(TextFile, MutableMapping):
         ----------
         identifier : str
             The identifier of the sequence.
         Returns
         -------
         sequence : str
             The sequence corresponding to the identifier.
         """
         if not isinstance(identifier, str):
-            raise IndexError(
-                "'FastqFile' only supports identifier strings as keys"
-            )
-        seq_start, seq_stop, score_start, score_stop \
-            = self._entries[identifier]
+            raise IndexError("'FastqFile' only supports identifier strings as keys")
+        seq_start, seq_stop, score_start, score_stop = self._entries[identifier]
         # Concatenate sequence string from the sequence lines
-        seq_str = "".join(self.lines[seq_start : seq_stop])
+        seq_str = "".join(self.lines[seq_start:seq_stop])
         return seq_str
     def get_quality(self, identifier):
         """
         Get the quality scores for the specified identifier.
@@ -192,24 +163,20 @@ class FastqFile(TextFile, MutableMapping):
         ----------
         identifier : str
             The identifier of the quality scores.
         Returns
         -------
         scores : ndarray, dtype=int
             The quality scores corresponding to the identifier.
         """
         if not isinstance(identifier, str):
-            raise IndexError(
-                "'FastqFile' only supports identifier strings as keys"
-            )
-        seq_start, seq_stop, score_start, score_stop \
-            = self._entries[identifier]
+            raise IndexError("'FastqFile' only supports identifier strings as keys")
+        seq_start, seq_stop, score_start, score_stop = self._entries[identifier]
         # Concatenate sequence string from the score lines
         return _score_str_to_scores(
-            "".join(self.lines[score_start : score_stop]),
-            self._offset
+            "".join(self.lines[score_start:score_stop]), self._offset
         )
     def __setitem__(self, identifier, item):
         sequence, scores = item
         if len(sequence) != len(scores):
@@ -218,24 +185,22 @@ class FastqFile(TextFile, MutableMapping):
                 f"but score length is {len(scores)}"
             )
         if not isinstance(identifier, str):
-            raise IndexError(
-                "'FastqFile' only supports strings as identifier"
-            )
+            raise IndexError("'FastqFile' only supports strings as identifier")
         # Delete lines of entry corresponding to the identifier,
         # if already existing
         if identifier in self:
             del self[identifier]
         # Create new lines
         # Start with identifier line
-        new_lines = ["@" + identifier.replace("\n","").strip()]
+        new_lines = ["@" + identifier.replace("\n", "").strip()]
         # Append new lines with sequence string (with line breaks)
         seq_start_i = len(new_lines)
         if self._chars_per_line is None:
             new_lines.append(str(sequence))
         else:
             new_lines += wrap_string(sequence, width=self._chars_per_line)
-        seq_stop_i =len(new_lines)
+        seq_stop_i = len(new_lines)
         # Append sequence-score separator
         new_lines += ["+"]
         # Append scores
@@ -261,29 +226,28 @@ class FastqFile(TextFile, MutableMapping):
                 len(self.lines) + seq_start_i,
                 len(self.lines) + seq_stop_i,
                 len(self.lines) + score_start_i,
-                len(self.lines) + score_stop_i
+                len(self.lines) + score_stop_i,
             )
             self.lines += new_lines
     def __getitem__(self, identifier):
         return self.get_seq_string(identifier), self.get_quality(identifier)
     def __delitem__(self, identifier):
-        seq_start, seq_stop, score_start, score_stop \
-            = self._entries[identifier]
-        del self.lines[seq_start-1 : score_stop]
+        seq_start, seq_stop, score_start, score_stop = self._entries[identifier]
+        del self.lines[seq_start - 1 : score_stop]
         del self._entries[identifier]
         self._find_entries()
     def __len__(self):
         return len(self._entries)
     def __iter__(self):
         return self._entries.__iter__()
     def __contains__(self, identifer):
         return identifer in self._entries
     def _find_entries(self):
         self._entries = OrderedDict()
         in_sequence = False
@@ -302,7 +266,7 @@ class FastqFile(TextFile, MutableMapping):
             if not in_scores and not in_sequence and line[0] == "@":
                 # Identifier line
                 identifier = line[1:]
-                seq_start_i = i+1
+                seq_start_i = i + 1
                 # Next line is sequence
                 in_sequence = True
                 # Reset
@@ -314,7 +278,7 @@ class FastqFile(TextFile, MutableMapping):
                     in_sequence = False
                     in_scores = True
                     seq_stop_i = i
-                    score_start_i = i+1
+                    score_start_i = i + 1
                 else:
                     # Still in sequence
                     seq_len += len(line)
@@ -330,9 +294,12 @@ class FastqFile(TextFile, MutableMapping):
                     in_scores = False
                     # Record this entry
                     self._entries[identifier] = (
-                        seq_start_i, seq_stop_i, score_start_i, score_stop_i
+                        seq_start_i,
+                        seq_stop_i,
+                        score_start_i,
+                        score_stop_i,
                     )
-                else: # score_len > seq_len
+                else:  # score_len > seq_len
                     raise InvalidFileError(
                         f"The amount of scores is not equal to the sequence "
                         f"length for the sequence in line {seq_start_i+1} "
@@ -343,14 +310,13 @@ class FastqFile(TextFile, MutableMapping):
         # must have properly ended
         if in_sequence or in_scores:
             raise InvalidFileError("The last entry in the file is incomplete")
     @staticmethod
     def read_iter(file, offset):
         """
         Create an iterator over each sequence (and corresponding scores)
         of the given FASTQ file.
         Parameters
         ----------
         file : file-like object or str
@@ -361,7 +327,7 @@ class FastqFile(TextFile, MutableMapping):
             ASCII code.
             Can either be directly the value, or a string that indicates
             the score format.
         Yields
         ------
         identifier : str
@@ -369,7 +335,7 @@ class FastqFile(TextFile, MutableMapping):
         sequence : tuple(str, ndarray)
             The current sequence as string and its corresponding quality
             scores as :class:`ndarray`.
         Notes
         -----
         This approach gives the same results as
@@ -377,7 +343,7 @@ class FastqFile(TextFile, MutableMapping):
         and much more memory efficient.
         """
         offset = _convert_offset(offset)
         identifier = None
         seq_str_list = []
         score_str_list = []
@@ -391,7 +357,7 @@ class FastqFile(TextFile, MutableMapping):
             # Ignore empty lines
             if len(line) == 0:
                 continue
             if not in_scores and not in_sequence and line[0] == "@":
                 # Track new entry
                 identifier = line[1:]
@@ -401,7 +367,7 @@ class FastqFile(TextFile, MutableMapping):
                 score_len = 0
                 seq_str_list = []
                 score_str_list = []
             elif in_sequence:
                 if line[0] == "+":
                     # End of sequence start of scores
@@ -411,7 +377,7 @@ class FastqFile(TextFile, MutableMapping):
                     # Still in sequence
                     seq_len += len(line)
                     seq_str_list.append(line)
             elif in_scores:
                 score_len += len(line)
                 score_str_list.append(line)
@@ -422,20 +388,15 @@ class FastqFile(TextFile, MutableMapping):
                     # -> End of entry
                     in_scores = False
                     # yield this entry
-                    scores = _score_str_to_scores(
-                        "".join(score_str_list),
-                        offset
-                    )
+                    scores = _score_str_to_scores("".join(score_str_list), offset)
                     yield identifier, ("".join(seq_str_list), scores)
-                else: # score_len > seq_len
+                else:  # score_len > seq_len
                     raise InvalidFileError(
-                        f"The amount of scores is not equal to the sequence "
-                        f"length"
+                        "The amount of scores is not equal to the sequence " "length"
                     )
             else:
-                raise InvalidFileError(f"FASTQ file is invalid")
+                raise InvalidFileError("FASTQ file is invalid")
     @staticmethod
     def write_iter(file, items, offset, chars_per_line=None):
@@ -449,7 +410,7 @@ class FastqFile(TextFile, MutableMapping):
         Hence, this static method may save a large amount of memory if
         a large file should be written, especially if the `items`
         are provided as generator.
         Parameters
         ----------
         file : file-like object or str
@@ -487,12 +448,10 @@ class FastqFile(TextFile, MutableMapping):
                         f"but score length is {len(scores)}"
                     )
                 if not isinstance(identifier, str):
-                    raise IndexError(
-                        "'FastqFile' only supports strings as identifier"
-                    )
+                    raise IndexError("'FastqFile' only supports strings as identifier")
                 # Yield identifier line
-                yield "@" + identifier.replace("\n","").strip()
+                yield "@" + identifier.replace("\n", "").strip()
                 # Yield sequence line(s)
                 if chars_per_line is None:
@@ -500,10 +459,10 @@ class FastqFile(TextFile, MutableMapping):
                 else:
                     for line in wrap_string(sequence, width=chars_per_line):
                         yield line
                 # Yield separator
                 yield "+"
                 # Yield scores
                 score_chars = _scores_to_score_str(scores, offset)
                 if chars_per_line is None:
@@ -511,7 +470,7 @@ class FastqFile(TextFile, MutableMapping):
                 else:
                     for line in wrap_string(score_chars, width=chars_per_line):
                         yield line
         TextFile.write_iter(file, line_generator())
@@ -519,15 +478,11 @@ def _score_str_to_scores(score_str, offset):
     """
     Convert an ASCII string into actual score values.
     """
-    scores = np.frombuffer(
-        bytearray(
-            score_str, encoding="ascii"
-        ),
-        dtype=np.int8
-    )
+    scores = np.frombuffer(bytearray(score_str, encoding="ascii"), dtype=np.int8)
     scores -= offset
     return scores
 def _scores_to_score_str(scores, offset):
     """
     Convert score values into an ASCII string.
@@ -535,6 +490,7 @@ def _scores_to_score_str(scores, offset):
     scores = np.asarray(scores) + offset
     return scores.astype(np.int8, copy=False).tobytes().decode("ascii")
 def _convert_offset(offset_val_or_string):
     """
     If the given offset is a string return the corresponding numerical
@@ -543,9 +499,9 @@ def _convert_offset(offset_val_or_string):
     if isinstance(offset_val_or_string, Integral):
         return offset_val_or_string
     elif isinstance(offset_val_or_string, str):
-       return _OFFSETS[offset_val_or_string]
+        return _OFFSETS[offset_val_or_string]
     else:
         raise TypeError(
             f"The offset must be either an integer or a string "
             f"indicating the format, not {type(offset_val_or_string).__name__}"
-        )
+        )

biotite/sequence/io/genbank/__init__.py CHANGED Viewed

@@ -11,7 +11,7 @@ and *GenPept* format.
 __name__ = "biotite.sequence.io.genbank"
 __author__ = "Patrick Kunzmann"
-from .file import *
 from .annotation import *
+from .file import *
+from .metadata import *
 from .sequence import *
-from .metadata import *

biotite/sequence/io/genbank/annotation.py CHANGED Viewed

@@ -12,10 +12,8 @@ __all__ = ["get_annotation", "set_annotation"]
 import re
 import warnings
-from ....file import InvalidFileError
-from ...annotation import Annotation, Feature, Location
-from .file import GenBankFile
+from biotite.file import InvalidFileError
+from biotite.sequence.annotation import Annotation, Feature, Location
 _KEY_START = 5
 _QUAL_START = 21
@@ -46,7 +44,6 @@ def get_annotation(gb_file, include_only=None):
         raise InvalidFileError("File has multiple 'FEATURES' fields")
     lines, _ = fields[0]
     ### Parse all lines to create an index of features,
     # i.e. pairs of the feature key
     # and the text belonging to the respective feature
@@ -60,13 +57,12 @@ def get_annotation(gb_file, include_only=None):
                 # Store old feature key and value
                 feature_list.append((feature_key, feature_value))
             # Track new key
-            feature_key = line[_KEY_START : _QUAL_START-1].strip()
+            feature_key = line[_KEY_START : _QUAL_START - 1].strip()
             feature_value = ""
         feature_value += line[_QUAL_START:] + " "
     # Store last feature key and value (loop already exited)
     feature_list.append((feature_key, feature_value))
     ### Process only relevant features and put them into an Annotation
     annotation = Annotation()
     # Regex to separate qualifiers from each other
@@ -92,7 +88,7 @@ def get_annotation(gb_file, include_only=None):
             loc_string = qualifier_parts.pop(0).strip()
             try:
                 locs = _parse_locs(loc_string)
-            except:
+            except Exception:
                 warnings.warn(
                     f"'{loc_string}' is an unsupported location identifier, "
                     f"skipping feature"
@@ -114,7 +110,7 @@ def get_annotation(gb_file, include_only=None):
                     # -> split at whitespaces,
                     # as keys do not contain whitespaces
                     for subpart in part.split():
-                        if not "=" in subpart:
+                        if "=" not in subpart:
                             # Qualifier without value, e.g. '/pseudo'
                             # -> store immediately
                             # Remove "/" -> subpart[1:]
@@ -147,11 +143,11 @@ def get_annotation(gb_file, include_only=None):
 def _parse_locs(loc_str):
     locs = []
     if loc_str.startswith(("join", "order")):
-        str_list = loc_str[loc_str.index("(")+1:loc_str.rindex(")")].split(",")
+        str_list = loc_str[loc_str.index("(") + 1 : loc_str.rindex(")")].split(",")
         for s in str_list:
             locs.extend(_parse_locs(s.strip()))
     elif loc_str.startswith("complement"):
-        compl_str = loc_str[loc_str.index("(")+1:loc_str.rindex(")")]
+        compl_str = loc_str[loc_str.index("(") + 1 : loc_str.rindex(")")]
         compl_locs = [
             Location(loc.first, loc.last, Location.Strand.REVERSE, loc.defect)
             for loc in _parse_locs(compl_str)
@@ -214,8 +210,6 @@ def _set_qual(qual_dict, key, val):
         qual_dict[key] = val
 def set_annotation(gb_file, annotation):
     """
     Set the *FEATURES* field of a GenBank file with an annotation.
@@ -236,12 +230,12 @@ def set_annotation(gb_file, annotation):
         for key, values in feature.qual.items():
             if values is None:
                 line = " " * _QUAL_START
-                line +=  f'/{key}'
+                line += f"/{key}"
                 lines.append(line)
             else:
                 for val in values.split("\n"):
                     line = " " * _QUAL_START
-                    line +=  f'/{key}="{val}"'
+                    line += f'/{key}="{val}"'
                     lines.append(line)
     gb_file.set_field("FEATURES", lines)
@@ -254,11 +248,11 @@ def _convert_to_loc_string(locs):
     if len(locs) == 1:
         loc = list(locs)[0]
         loc_first_str = str(loc.first)
-        loc_last_str  = str(loc.last)
+        loc_last_str = str(loc.last)
         if loc.defect & Location.Defect.BEYOND_LEFT:
             loc_first_str = "<" + loc_first_str
         if loc.defect & Location.Defect.BEYOND_RIGHT:
-            loc_last_str  = ">" + loc_last_str
+            loc_last_str = ">" + loc_last_str
         if loc.first == loc.last:
             loc_string = loc_first_str
         elif loc.defect & Location.Defect.UNK_LOC:
@@ -270,8 +264,6 @@ def _convert_to_loc_string(locs):
         if loc.strand == Location.Strand.REVERSE:
             loc_string = f"complement({loc_string})"
     else:
-        loc_string = ",".join(
-            [_convert_to_loc_string([loc]) for loc in locs]
-        )
+        loc_string = ",".join([_convert_to_loc_string([loc]) for loc in locs])
         loc_string = f"join({loc_string})"
     return loc_string