PyPI - biotite - Versions diffs - 0.41.2__cp310-cp310-win_amd64.whl → 1.0.0__cp310-cp310-win_amd64.whl - Mend

biotite 0.41.2__cp310-cp310-win_amd64.whl → 1.0.0__cp310-cp310-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of biotite might be problematic. Click here for more details.

Files changed (205)

biotite/__init__.py +2 -3
biotite/application/__init__.py +1 -1
biotite/application/application.py +20 -10
biotite/application/autodock/__init__.py +1 -1
biotite/application/autodock/app.py +74 -79
biotite/application/blast/__init__.py +1 -1
biotite/application/blast/alignment.py +19 -10
biotite/application/blast/webapp.py +92 -85
biotite/application/clustalo/__init__.py +1 -1
biotite/application/clustalo/app.py +46 -61
biotite/application/dssp/__init__.py +1 -1
biotite/application/dssp/app.py +8 -11
biotite/application/localapp.py +62 -60
biotite/application/mafft/__init__.py +1 -1
biotite/application/mafft/app.py +16 -22
biotite/application/msaapp.py +78 -89
biotite/application/muscle/__init__.py +1 -1
biotite/application/muscle/app3.py +50 -64
biotite/application/muscle/app5.py +23 -31
biotite/application/sra/__init__.py +1 -1
biotite/application/sra/app.py +64 -68
biotite/application/tantan/__init__.py +1 -1
biotite/application/tantan/app.py +22 -45
biotite/application/util.py +7 -9
biotite/application/viennarna/rnaalifold.py +34 -28
biotite/application/viennarna/rnafold.py +24 -39
biotite/application/viennarna/rnaplot.py +36 -21
biotite/application/viennarna/util.py +17 -12
biotite/application/webapp.py +13 -14
biotite/copyable.py +13 -13
biotite/database/__init__.py +1 -1
biotite/database/entrez/__init__.py +1 -1
biotite/database/entrez/check.py +2 -3
biotite/database/entrez/dbnames.py +7 -5
biotite/database/entrez/download.py +55 -49
biotite/database/entrez/key.py +1 -1
biotite/database/entrez/query.py +62 -23
biotite/database/error.py +2 -1
biotite/database/pubchem/__init__.py +1 -1
biotite/database/pubchem/download.py +43 -45
biotite/database/pubchem/error.py +2 -2
biotite/database/pubchem/query.py +34 -31
biotite/database/pubchem/throttle.py +3 -4
biotite/database/rcsb/__init__.py +1 -1
biotite/database/rcsb/download.py +44 -52
biotite/database/rcsb/query.py +85 -80
biotite/database/uniprot/check.py +6 -3
biotite/database/uniprot/download.py +6 -11
biotite/database/uniprot/query.py +115 -31
biotite/file.py +12 -31
biotite/sequence/__init__.py +3 -3
biotite/sequence/align/__init__.py +2 -2
biotite/sequence/align/alignment.py +99 -90
biotite/sequence/align/banded.cp310-win_amd64.pyd +0 -0
biotite/sequence/align/buckets.py +12 -10
biotite/sequence/align/cigar.py +43 -52
biotite/sequence/align/kmeralphabet.cp310-win_amd64.pyd +0 -0
biotite/sequence/align/kmeralphabet.pyx +55 -51
biotite/sequence/align/kmersimilarity.cp310-win_amd64.pyd +0 -0
biotite/sequence/align/kmertable.cp310-win_amd64.pyd +0 -0
biotite/sequence/align/kmertable.pyx +3 -2
biotite/sequence/align/localgapped.cp310-win_amd64.pyd +0 -0
biotite/sequence/align/localungapped.cp310-win_amd64.pyd +0 -0
biotite/sequence/align/matrix.py +81 -82
biotite/sequence/align/multiple.cp310-win_amd64.pyd +0 -0
biotite/sequence/align/multiple.pyx +1 -1
biotite/sequence/align/pairwise.cp310-win_amd64.pyd +0 -0
biotite/sequence/align/permutation.cp310-win_amd64.pyd +0 -0
biotite/sequence/align/permutation.pyx +12 -4
biotite/sequence/align/selector.cp310-win_amd64.pyd +0 -0
biotite/sequence/align/selector.pyx +52 -54
biotite/sequence/align/statistics.py +32 -33
biotite/sequence/align/tracetable.cp310-win_amd64.pyd +0 -0
biotite/sequence/alphabet.py +51 -65
biotite/sequence/annotation.py +78 -77
biotite/sequence/codec.cp310-win_amd64.pyd +0 -0
biotite/sequence/codon.py +90 -79
biotite/sequence/graphics/__init__.py +1 -1
biotite/sequence/graphics/alignment.py +184 -103
biotite/sequence/graphics/colorschemes.py +10 -12
biotite/sequence/graphics/dendrogram.py +79 -34
biotite/sequence/graphics/features.py +133 -99
biotite/sequence/graphics/logo.py +22 -28
biotite/sequence/graphics/plasmid.py +229 -178
biotite/sequence/io/fasta/__init__.py +1 -1
biotite/sequence/io/fasta/convert.py +44 -33
biotite/sequence/io/fasta/file.py +42 -55
biotite/sequence/io/fastq/__init__.py +1 -1
biotite/sequence/io/fastq/convert.py +11 -14
biotite/sequence/io/fastq/file.py +68 -112
biotite/sequence/io/genbank/__init__.py +2 -2
biotite/sequence/io/genbank/annotation.py +12 -20
biotite/sequence/io/genbank/file.py +74 -76
biotite/sequence/io/genbank/metadata.py +74 -62
biotite/sequence/io/genbank/sequence.py +13 -14
biotite/sequence/io/general.py +39 -30
biotite/sequence/io/gff/__init__.py +2 -2
biotite/sequence/io/gff/convert.py +10 -15
biotite/sequence/io/gff/file.py +81 -65
biotite/sequence/phylo/__init__.py +1 -1
biotite/sequence/phylo/nj.cp310-win_amd64.pyd +0 -0
biotite/sequence/phylo/tree.cp310-win_amd64.pyd +0 -0
biotite/sequence/phylo/upgma.cp310-win_amd64.pyd +0 -0
biotite/sequence/profile.py +57 -28
biotite/sequence/search.py +17 -15
biotite/sequence/seqtypes.py +200 -164
biotite/sequence/sequence.py +15 -17
biotite/structure/__init__.py +3 -3
biotite/structure/atoms.py +221 -235
biotite/structure/basepairs.py +260 -271
biotite/structure/bonds.cp310-win_amd64.pyd +0 -0
biotite/structure/bonds.pyx +29 -32
biotite/structure/box.py +67 -71
biotite/structure/celllist.cp310-win_amd64.pyd +0 -0
biotite/structure/chains.py +55 -39
biotite/structure/charges.cp310-win_amd64.pyd +0 -0
biotite/structure/compare.py +32 -32
biotite/structure/density.py +13 -18
biotite/structure/dotbracket.py +20 -22
biotite/structure/error.py +10 -2
biotite/structure/filter.py +82 -77
biotite/structure/geometry.py +130 -119
biotite/structure/graphics/atoms.py +60 -43
biotite/structure/graphics/rna.py +81 -68
biotite/structure/hbond.py +112 -93
biotite/structure/info/__init__.py +0 -2
biotite/structure/info/atoms.py +10 -11
biotite/structure/info/bonds.py +41 -43
biotite/structure/info/ccd.py +4 -5
biotite/structure/info/groups.py +1 -3
biotite/structure/info/masses.py +5 -10
biotite/structure/info/misc.py +1 -1
biotite/structure/info/radii.py +20 -20
biotite/structure/info/standardize.py +15 -26
biotite/structure/integrity.py +18 -71
biotite/structure/io/__init__.py +3 -4
biotite/structure/io/dcd/__init__.py +1 -1
biotite/structure/io/dcd/file.py +22 -20
biotite/structure/io/general.py +47 -61
biotite/structure/io/gro/__init__.py +1 -1
biotite/structure/io/gro/file.py +73 -72
biotite/structure/io/mol/__init__.py +1 -1
biotite/structure/io/mol/convert.py +8 -11
biotite/structure/io/mol/ctab.py +37 -36
biotite/structure/io/mol/header.py +14 -10
biotite/structure/io/mol/mol.py +9 -53
biotite/structure/io/mol/sdf.py +47 -50
biotite/structure/io/netcdf/__init__.py +1 -1
biotite/structure/io/netcdf/file.py +24 -23
biotite/structure/io/pdb/__init__.py +1 -1
biotite/structure/io/pdb/convert.py +32 -20
biotite/structure/io/pdb/file.py +151 -172
biotite/structure/io/pdb/hybrid36.cp310-win_amd64.pyd +0 -0
biotite/structure/io/pdbqt/__init__.py +1 -1
biotite/structure/io/pdbqt/convert.py +17 -11
biotite/structure/io/pdbqt/file.py +128 -80
biotite/structure/io/pdbx/__init__.py +1 -2
biotite/structure/io/pdbx/bcif.py +36 -44
biotite/structure/io/pdbx/cif.py +64 -62
biotite/structure/io/pdbx/component.py +10 -16
biotite/structure/io/pdbx/convert.py +235 -246
biotite/structure/io/pdbx/encoding.cp310-win_amd64.pyd +0 -0
biotite/structure/io/trajfile.py +76 -93
biotite/structure/io/trr/__init__.py +1 -1
biotite/structure/io/trr/file.py +12 -15
biotite/structure/io/xtc/__init__.py +1 -1
biotite/structure/io/xtc/file.py +11 -14
biotite/structure/mechanics.py +9 -11
biotite/structure/molecules.py +3 -4
biotite/structure/pseudoknots.py +53 -67
biotite/structure/rdf.py +23 -21
biotite/structure/repair.py +137 -86
biotite/structure/residues.py +26 -16
biotite/structure/sasa.cp310-win_amd64.pyd +0 -0
biotite/structure/{resutil.py → segments.py} +24 -23
biotite/structure/sequence.py +10 -11
biotite/structure/sse.py +100 -119
biotite/structure/superimpose.py +39 -77
biotite/structure/transform.py +97 -71
biotite/structure/util.py +11 -13
biotite/version.py +2 -2
biotite/visualize.py +69 -55
{biotite-0.41.2.dist-info → biotite-1.0.0.dist-info}/METADATA +5 -5
biotite-1.0.0.dist-info/RECORD +322 -0
biotite/structure/io/ctab.py +0 -72
biotite/structure/io/mmtf/__init__.py +0 -21
biotite/structure/io/mmtf/assembly.py +0 -214
biotite/structure/io/mmtf/convertarray.cp310-win_amd64.pyd +0 -0
biotite/structure/io/mmtf/convertarray.pyx +0 -341
biotite/structure/io/mmtf/convertfile.cp310-win_amd64.pyd +0 -0
biotite/structure/io/mmtf/convertfile.pyx +0 -501
biotite/structure/io/mmtf/decode.cp310-win_amd64.pyd +0 -0
biotite/structure/io/mmtf/decode.pyx +0 -152
biotite/structure/io/mmtf/encode.cp310-win_amd64.pyd +0 -0
biotite/structure/io/mmtf/encode.pyx +0 -183
biotite/structure/io/mmtf/file.py +0 -233
biotite/structure/io/npz/__init__.py +0 -20
biotite/structure/io/npz/file.py +0 -152
biotite/structure/io/pdbx/legacy.py +0 -267
biotite/structure/io/tng/__init__.py +0 -13
biotite/structure/io/tng/file.py +0 -46
biotite/temp.py +0 -86
biotite-0.41.2.dist-info/RECORD +0 -340
{biotite-0.41.2.dist-info → biotite-1.0.0.dist-info}/WHEEL +0 -0
{biotite-0.41.2.dist-info → biotite-1.0.0.dist-info}/licenses/LICENSE.rst +0 -0

biotite/sequence/io/genbank/file.py CHANGED Viewed

@@ -6,14 +6,16 @@ __name__ = "biotite.sequence.io.genbank"
 __author__ = "Patrick Kunzmann"
 __all__ = ["GenBankFile", "MultiFile"]
-#import textwrap
+# import textwrap
 import copy
-#import re
+# import re
 import io
-from ....file import TextFile, InvalidFileError
 from collections import OrderedDict
-#from ...annotation import Location, Feature, Annotation, AnnotatedSequence
-#from ...seqtypes import NucleotideSequence, ProteinSequence
+from biotite.file import InvalidFileError, TextFile
+# from ...annotation import Location, Feature, Annotation, AnnotatedSequence
+# from ...seqtypes import NucleotideSequence, ProteinSequence
 class GenBankFile(TextFile):
@@ -33,7 +35,7 @@ class GenBankFile(TextFile):
     Some fields may occur multiple times, e.g. the *REFERENCE* field.
     A sample GenBank file can be viewed at
     `<https://www.ncbi.nlm.nih.gov/Sitemap/samplerecord.html>`_.
     This class provides a low-level interface for parsing, editing and
     writing GenBank files.
     It works like a list of field entries, where a field consists of the
@@ -47,7 +49,7 @@ class GenBankFile(TextFile):
     The subfields are represented by a dictionary, with subfield names
     being keys and the corresponding lines being values.
     The *FEATURES* and *ORIGIN* fields have no subfields.
     Every entry can be obtained, set and deleted via the index operator.
     Notes
@@ -55,7 +57,7 @@ class GenBankFile(TextFile):
     This class does not support location identifiers with references
     to other Entrez database entries, e.g.
     ``join(1..100,J00194.1:100..202)``.
     Examples
     --------
     Create a GenBank file from scratch:
@@ -79,9 +81,9 @@ class GenBankFile(TextFile):
     ['One line', 'A second line']
     >>> print(subfields)
     OrderedDict([('SUBFIELD1', ['Single Line']), ('SUBFIELD2', ['Two', 'lines'])])
     Adding an additional field:
     >>> file.insert(0, "OTHERFIELD", ["Another line"])
     >>> print(len(file))
     2
@@ -174,18 +176,18 @@ class GenBankFile(TextFile):
         # and names of categories
         self._field_pos = []
         self._find_field_indices()
     @classmethod
     def read(cls, file):
         """
         Read a GenBank file.
         Parameters
         ----------
         file : file-like object or str
             The file to be read.
             Alternatively a file path can be supplied.
         Returns
         -------
         file_object : GenBankFile
@@ -194,16 +196,16 @@ class GenBankFile(TextFile):
         file = super().read(file)
         file._find_field_indices()
         return file
     def get_fields(self, name):
         """
         Get all *GenBank* fields associated with a given field name.
         Parameters
         ----------
         name : str
             The field name.
         Returns
         -------
         fields : list of (list of str, OrderedDict of str -> str)
@@ -218,17 +220,17 @@ class GenBankFile(TextFile):
         indices = self.get_indices(name)
         # Omit the field name
         return [self[i][1:] for i in indices]
     def get_indices(self, name):
         """
         Get the indices to all *GenBank* fields associated with a given
         field name.
         Parameters
         ----------
         name : str
             The field name.
         Returns
         -------
         fields : list of int
@@ -242,7 +244,7 @@ class GenBankFile(TextFile):
             if fname == name:
                 indices.append(i)
         return indices
     def set_field(self, name, content, subfield_dict=None):
         """
         Set a *GenBank* field with the given content.
@@ -250,7 +252,7 @@ class GenBankFile(TextFile):
         If the field already exists in the file, the field is
         overwritten, otherwise a new field is created at the end of
         the file.
         Parameters
         ----------
         name : str
@@ -261,7 +263,7 @@ class GenBankFile(TextFile):
             The subfields of the field.
             The dictionary maps subfield names to the content lines of
             the respective subfield.
         Raises
         ------
         InvalidFileError
@@ -283,13 +285,13 @@ class GenBankFile(TextFile):
     def __getitem__(self, index):
         index = self._translate_idx(index)
         start, stop, name = self._field_pos[index]
         if name in ["FEATURES", "ORIGIN"]:
             # For those two fields return the complete lines,
             # beginning with the line after the field name
-            content = self._get_field_content(start+1, stop, indent=0)
+            content = self._get_field_content(start + 1, stop, indent=0)
             subfield_dict = OrderedDict()
         else:
             # For all metadata fields use the
             # standard GenBank indentation (=12)
@@ -297,11 +299,11 @@ class GenBankFile(TextFile):
             subfield_dict = OrderedDict()
             subfield_start = None
             first_subfield_start = None
-            for i in range(start+1, stop):
+            header = None
+            for i in range(start + 1, stop):
                 line = self.lines[i]
-                # Check if line contains a new subfield
-                # (Header beginning from first column)
                 if len(line) != 0 and line[:12].strip() != "":
+                    # New header -> new subfield
                     if first_subfield_start is None:
                         first_subfield_start = i
                     # Store previous subfield
@@ -320,12 +322,10 @@ class GenBankFile(TextFile):
             # that are not part of a subfield
             if first_subfield_start is not None:
                 stop = first_subfield_start
-            content = self._get_field_content(
-                start, stop, indent=12
-            )
+            content = self._get_field_content(start, stop, indent=12)
         return name, content, subfield_dict
     def __setitem__(self, index, item):
         index = self._translate_idx(index)
         if not isinstance(item, tuple):
@@ -342,7 +342,7 @@ class GenBankFile(TextFile):
                 "Expected a tuple of name, content and optionally subfields"
             )
         inserted_lines = self._to_lines(name, content, subfields)
         # Stop of field to be replaced is start of new field
         start, old_stop, _ = self._field_pos[index]
         # If not the last element is set,
@@ -355,12 +355,12 @@ class GenBankFile(TextFile):
         # Shift the start/stop indices of the following fields
         # by the amount of created fields
         shift = len(inserted_lines) - (old_stop - start)
-        for i in range(index+1, len(self._field_pos)):
+        for i in range(index + 1, len(self._field_pos)):
             old_start, old_stop, fname = self._field_pos[i]
-            self._field_pos[i] = old_start+shift, old_stop+shift, fname
+            self._field_pos[i] = old_start + shift, old_stop + shift, fname
         # Add new entry
-        self._field_pos[index] = start, start+len(inserted_lines), name.upper()
+        self._field_pos[index] = start, start + len(inserted_lines), name.upper()
     def __delitem__(self, index):
         index = self._translate_idx(index)
         start, stop, _ = self._field_pos[index]
@@ -369,17 +369,17 @@ class GenBankFile(TextFile):
         shift = stop - start
         for i in range(index, len(self._field_pos)):
             old_start, old_stop, name = self._field_pos[i]
-            self._field_pos[i] = old_start-shift, old_stop-shift, name
-        del self.lines[start : stop]
+            self._field_pos[i] = old_start - shift, old_stop - shift, name
+        del self.lines[start:stop]
         del self._field_pos[index]
     def __len__(self):
         return len(self._field_pos)
     def insert(self, index, name, content, subfields=None):
         """
         Insert a *GenBank* field at the given position.
         Parameters
         ----------
         index : int
@@ -398,12 +398,12 @@ class GenBankFile(TextFile):
         """
         index = self._translate_idx(index, length_exclusive=False)
         inserted_lines = self._to_lines(name, content, subfields)
         # Stop of previous field is start of new field
         if index == 0:
             start = 0
         else:
-            _, start, _ = self._field_pos[index-1]
+            _, start, _ = self._field_pos[index - 1]
         # If the new lines are not inserted at the end,
         # the following lines need to be added, too
         if start is not len(self.lines):
@@ -416,17 +416,16 @@ class GenBankFile(TextFile):
         shift = len(inserted_lines)
         for i in range(index, len(self._field_pos)):
             old_start, old_stop, fname = self._field_pos[i]
-            self._field_pos[i] = old_start+shift, old_stop+shift, fname
+            self._field_pos[i] = old_start + shift, old_stop + shift, fname
         # Add new entry
         self._field_pos.insert(
-            index,
-            (start, start+len(inserted_lines), name.upper())
+            index, (start, start + len(inserted_lines), name.upper())
         )
     def append(self, name, content, subfields=None):
         """
         Create a new *GenBank* field at the end of the file.
         Parameters
         ----------
         name : str
@@ -440,7 +439,6 @@ class GenBankFile(TextFile):
         """
         self.insert(len(self), name, content, subfields)
     def _find_field_indices(self):
         """
         Identify the start and exclusive stop indices of lines
@@ -469,10 +467,10 @@ class GenBankFile(TextFile):
     def _get_field_content(self, start, stop, indent):
         if indent == 0:
-            return self.lines[start : stop]
+            return self.lines[start:stop]
         else:
-            return [line[12:] for line in self.lines[start : stop]]
+            return [line[12:] for line in self.lines[start:stop]]
     def _to_lines(self, name, content, subfields):
         """
         Convert the field name, field content und subfield dictionary
@@ -480,22 +478,22 @@ class GenBankFile(TextFile):
         """
         if subfields is None:
             subfields = {}
         name = name.strip().upper()
         if len(name) == 0:
-            raise ValueError(f"Must give a non emtpy name")
-        subfields = OrderedDict({
-            subfield_name.upper().strip() : subfield_lines
-            for subfield_name, subfield_lines in subfields.items()
-        })
+            raise ValueError("Must give a non emtpy name")
+        subfields = OrderedDict(
+            {
+                subfield_name.upper().strip(): subfield_lines
+                for subfield_name, subfield_lines in subfields.items()
+            }
+        )
         # Create lines for new field
         if name == "FEATURES":
             # Header line plus all actual feature lines
             lines = copy.copy(content)
-            lines.insert(
-                0, "FEATURES" + " "*13 + "Location/Qualifiers"
-            )
+            lines.insert(0, "FEATURES" + " " * 13 + "Location/Qualifiers")
         elif name == "ORIGIN":
             # Header line plus all actual sequence lines
             lines = copy.copy(content)
@@ -504,19 +502,19 @@ class GenBankFile(TextFile):
             name_column = []
             content_column = []
             # Create a line for the field name and empty lines
-            # for each additional line required by the content
-            name_column += [name] + [""] * (len(content)-1)
+            # for each additional line required by the content
+            name_column += [name] + [""] * (len(content) - 1)
             content_column += content
             for subfield_name, subfield_lines in subfields.items():
-                name_column += ["  " + subfield_name] \
-                               + [""] * (len(subfield_lines)-1)
+                name_column += ["  " + subfield_name] + [""] * (len(subfield_lines) - 1)
                 content_column += subfield_lines
-            lines = [f"{n_col:12}{c_col}" for n_col, c_col
-                              in zip(name_column, content_column)]
+            lines = [
+                f"{n_col:12}{c_col}"
+                for n_col, c_col in zip(name_column, content_column)
+            ]
         return lines
     def _translate_idx(self, index, length_exclusive=True):
         """
         Check index boundaries and convert negative index to positive
@@ -539,15 +537,15 @@ class MultiFile(TextFile):
     """
     This class represents a file in *GenBank* or *GenPept* format,
     that contains multiple entries, for more than one UID.
     The information for each UID are appended to each other in such a
     file.
     Objects of this class can be iterated to obtain a
     :class:`GenBankFile` for each entry in the file.
     Examples
     --------
     >>> import os.path
     >>> file_name = fetch_single_file(
     ...     ["1L2Y_A", "3O5R_A", "5UGO_A"],
@@ -568,8 +566,8 @@ class MultiFile(TextFile):
             line = self.lines[i]
             if line.strip() == "//":
                 # Create file with lines corresponding to that file
-                file_content = "\n".join(self.lines[start_i : i+1])
+                file_content = "\n".join(self.lines[start_i : i + 1])
                 file = GenBankFile.read(io.StringIO(file_content))
                 # Reset file start index
                 start_i = i
-                yield file
+                yield file

biotite/sequence/io/genbank/metadata.py CHANGED Viewed

@@ -8,17 +8,24 @@ Functions for obtaining metadata fields of a GenBank file.
 __name__ = "biotite.sequence.io.genbank"
 __author__ = "Patrick Kunzmann, Natasha Jaffe"
-__all__ = ["get_locus", "get_definition", "get_accession", "get_version",
-           "get_gi", "get_db_link", "get_source",
-           "set_locus"]
+__all__ = [
+    "get_locus",
+    "get_definition",
+    "get_accession",
+    "get_version",
+    "get_gi",
+    "get_db_link",
+    "get_source",
+    "set_locus",
+]
+from biotite.file import InvalidFileError
-from ....file import InvalidFileError
-from .file import GenBankFile
 def get_locus(gb_file):
     """
     Parse the *LOCUS* field of a GenBank or GenPept file.
     Parameters
     ----------
     gb_file : GenBankFile
@@ -39,10 +46,10 @@ def get_locus(gb_file):
         The GenBank division to which the file belongs.
     date : str, optional
         The date of last modification.
     Examples
     --------
     >>> import os.path
     >>> file = GenBankFile.read(os.path.join(path_to_sequences, "ec_bl21.gb"))
     >>> name, length, mol_type, is_circular, division, date = get_locus(file)
@@ -68,59 +75,57 @@ def get_locus(gb_file):
     # The first field will always be the ID
     name = fields[0]
-    # The second field will always be the length followed
+    # The second field will always be the length followed
     # by units (eg 1224 aa)
     length = int(fields[1])
-    # The third field *should* be the molecular type
+    # The third field *should* be the molecular type
     # but sometimes this is missing.  This gets tricky
     # because sometimes the next field, circular/linear,
     # is missing, too. The field after that, division,
     # is a 3 letter all caps token. Unfortunately, mol_type
-    # is also often a 3 letter all caps token (eg DNA)!
+    # is also often a 3 letter all caps token (eg DNA)!
     # Fortunately, GenBank publishes the set list of divisions
     # here: https://www.ncbi.nlm.nih.gov/genbank/samplerecord ,
     # so we can check against that set when determining whether
     # the current token represents the molecular type.
     divisions = (
-        'PRI', # primate sequences
-        'ROD', # rodent sequences
-        'MAM', # other mammalian sequences
-        'VRT', # other vertebrate sequences
-        'INV', # invertebrate sequences
-        'PLN', # plant, fungal, and algal sequences
-        'BCT', # bacterial sequences
-        'VRL', # viral sequences
-        'PHG', # bacteriophage sequences
-        'SYN', # synthetic sequences
-        'UNA', # unannotated sequences
-        'EST', # EST sequences (expressed sequence tags)
-        'PAT', # patent sequences
-        'STS', # STS sequences (sequence tagged sites)
-        'GSS', # GSS sequences (genome survey sequences)
-        'HTG', # HTG sequences (high-throughput genomic sequences)
-        'HTC', # unfinished high-throughput cDNA sequencing
-        'ENV', # environmental sampling sequences
-        'CON',
+        "PRI",  # primate sequences
+        "ROD",  # rodent sequences
+        "MAM",  # other mammalian sequences
+        "VRT",  # other vertebrate sequences
+        "INV",  # invertebrate sequences
+        "PLN",  # plant, fungal, and algal sequences
+        "BCT",  # bacterial sequences
+        "VRL",  # viral sequences
+        "PHG",  # bacteriophage sequences
+        "SYN",  # synthetic sequences
+        "UNA",  # unannotated sequences
+        "EST",  # EST sequences (expressed sequence tags)
+        "PAT",  # patent sequences
+        "STS",  # STS sequences (sequence tagged sites)
+        "GSS",  # GSS sequences (genome survey sequences)
+        "HTG",  # HTG sequences (high-throughput genomic sequences)
+        "HTC",  # unfinished high-throughput cDNA sequencing
+        "ENV",  # environmental sampling sequences
+        "CON",
     )
-    # NOTE: Remember that fields[2] is the unit for length,
+    # NOTE: Remember that fields[2] is the unit for length,
     #       eg bp or aa, so we move to fields[3] here.
-    if fields[3] not in ('linear', 'circular') \
-        and fields[3] not in divisions:
+    if fields[3] not in ("linear", "circular") and fields[3] not in divisions:
         mol_type = fields[3]
         next_idx = 4
     else:
         mol_type = None
         next_idx = 3
-    # The next field should be the token 'linear' or 'circular',
+    # The next field should be the token 'linear' or 'circular',
     # but sometimes this is missing
-    if 'linear' == fields[next_idx]:
+    if "linear" == fields[next_idx]:
         is_circular = False
         next_idx += 1
-    elif 'circular' == fields[next_idx]:
+    elif "circular" == fields[next_idx]:
         is_circular = True
         next_idx += 1
     else:
@@ -136,23 +141,24 @@ def get_locus(gb_file):
     return name, length, mol_type, is_circular, division, date
 def get_definition(gb_file):
     """
     Parse the *DEFINITION* field of a GenBank or GenPept file.
     Parameters
     ----------
     gb_file : GenBankFile
         The GenBank file to read the *DEFINITION* field from.
     Returns
     -------
     definition : str
         Content of the *DEFINITION* field.
     Examples
     --------
     >>> import os.path
     >>> file = GenBankFile.read(os.path.join(path_to_sequences, "ec_bl21.gb"))
     >>> print(get_definition(file))
@@ -161,23 +167,24 @@ def get_definition(gb_file):
     lines, _ = _expect_single_field(gb_file, "DEFINITION")
     return " ".join([line.strip() for line in lines])
 def get_accession(gb_file):
     """
     Parse the *ACCESSION* field of a GenBank or GenPept file.
     Parameters
     ----------
     gb_file : GenBankFile
         The GenBank file to read the *ACCESSION* field from.
     Returns
     -------
     accession : str
         The accession ID of the file.
     Examples
     --------
     >>> import os.path
     >>> file = GenBankFile.read(os.path.join(path_to_sequences, "ec_bl21.gb"))
     >>> print(get_accession(file))
@@ -187,16 +194,17 @@ def get_accession(gb_file):
     # 'ACCESSION' field has only one line
     return lines[0]
 def get_version(gb_file):
     """
     Parse the version from the *VERSION* field of a GenBank or GenPept
     file.
     Parameters
     ----------
     gb_file : GenBankFile
         The GenBank file to read the *VERSION* field from.
     Returns
     -------
     version : str
@@ -206,16 +214,17 @@ def get_version(gb_file):
     # 'VERSION' field has only one line
     return lines[0].split()[0]
 def get_gi(gb_file):
     """
     Parse the GI from the *VERSION* field of a GenBank or GenPept
     file.
     Parameters
     ----------
     gb_file : GenBankFile
         The GenBank file to read the *VERSION* field from.
     Returns
     -------
     gi : str
@@ -229,24 +238,25 @@ def get_gi(gb_file):
     # Truncate GI
     return int(version_info[1][3:])
 def get_db_link(gb_file):
     """
     Parse the *DBLINK* field of a GenBank or GenPept file.
     Parameters
     ----------
     gb_file : GenBankFile
         The GenBank file to read the *DBLINK* field from.
     Returns
     -------
     link_dict : dict
         A dictionary storing the database links, with the database
         name as key, and the corresponding ID as value.
     Examples
     --------
     >>> import os.path
     >>> file = GenBankFile.read(os.path.join(path_to_sequences, "ec_bl21.gb"))
     >>> for key, val in get_db_link(file).items():
@@ -265,12 +275,12 @@ def get_db_link(gb_file):
 def get_source(gb_file):
     """
     Parse the *SOURCE* field of a GenBank or GenPept file.
     Parameters
     ----------
     gb_file : GenBankFile
         The GenBank file to read the *SOURCE* field from.
     Returns
     -------
     accession : str
@@ -290,12 +300,12 @@ def _expect_single_field(gb_file, name):
     return fields[0]
-def set_locus(gb_file, name, length, mol_type=None, is_circular=False,
-              division=None, date=None):
+def set_locus(
+    gb_file, name, length, mol_type=None, is_circular=False, division=None, date=None
+):
     """
     Set the *LOCUS* field of a GenBank file.
     Parameters
     ----------
     gb_file : GenBankFile
@@ -319,6 +329,8 @@ def set_locus(gb_file, name, length, mol_type=None, is_circular=False,
     circularity = "circular" if is_circular else "linear"
     division = "" if division is None else division
     date = "" if date is None else date
-    line = f"{name:18} {length:>9} {restype_abbr} {mol_type:^10} " \
-           f"{circularity:8} {division:3} {date:11}"
-    gb_file.set_field("LOCUS", [line])
+    line = (
+        f"{name:18} {length:>9} {restype_abbr} {mol_type:^10} "
+        f"{circularity:8} {division:3} {date:11}"
+    )
+    gb_file.set_field("LOCUS", [line])