PyPI - biotite - Versions diffs - 0.41.2__cp311-cp311-win_amd64.whl → 1.0.1__cp311-cp311-win_amd64.whl - Mend

biotite 0.41.2__cp311-cp311-win_amd64.whl → 1.0.1__cp311-cp311-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of biotite might be problematic. Click here for more details.

Files changed (205) hide show

biotite/__init__.py +2 -3
biotite/application/__init__.py +1 -1
biotite/application/application.py +20 -10
biotite/application/autodock/__init__.py +1 -1
biotite/application/autodock/app.py +74 -79
biotite/application/blast/__init__.py +1 -1
biotite/application/blast/alignment.py +19 -10
biotite/application/blast/webapp.py +92 -85
biotite/application/clustalo/__init__.py +1 -1
biotite/application/clustalo/app.py +46 -61
biotite/application/dssp/__init__.py +1 -1
biotite/application/dssp/app.py +8 -11
biotite/application/localapp.py +62 -60
biotite/application/mafft/__init__.py +1 -1
biotite/application/mafft/app.py +16 -22
biotite/application/msaapp.py +78 -89
biotite/application/muscle/__init__.py +1 -1
biotite/application/muscle/app3.py +50 -64
biotite/application/muscle/app5.py +23 -31
biotite/application/sra/__init__.py +1 -1
biotite/application/sra/app.py +64 -68
biotite/application/tantan/__init__.py +1 -1
biotite/application/tantan/app.py +22 -45
biotite/application/util.py +7 -9
biotite/application/viennarna/rnaalifold.py +34 -28
biotite/application/viennarna/rnafold.py +24 -39
biotite/application/viennarna/rnaplot.py +36 -21
biotite/application/viennarna/util.py +17 -12
biotite/application/webapp.py +13 -14
biotite/copyable.py +13 -13
biotite/database/__init__.py +1 -1
biotite/database/entrez/__init__.py +1 -1
biotite/database/entrez/check.py +2 -3
biotite/database/entrez/dbnames.py +7 -5
biotite/database/entrez/download.py +55 -49
biotite/database/entrez/key.py +1 -1
biotite/database/entrez/query.py +62 -23
biotite/database/error.py +2 -1
biotite/database/pubchem/__init__.py +1 -1
biotite/database/pubchem/download.py +43 -45
biotite/database/pubchem/error.py +2 -2
biotite/database/pubchem/query.py +34 -31
biotite/database/pubchem/throttle.py +3 -4
biotite/database/rcsb/__init__.py +1 -1
biotite/database/rcsb/download.py +44 -52
biotite/database/rcsb/query.py +85 -80
biotite/database/uniprot/check.py +6 -3
biotite/database/uniprot/download.py +6 -11
biotite/database/uniprot/query.py +115 -31
biotite/file.py +12 -31
biotite/sequence/__init__.py +3 -3
biotite/sequence/align/__init__.py +2 -2
biotite/sequence/align/alignment.py +99 -90
biotite/sequence/align/banded.cp311-win_amd64.pyd +0 -0
biotite/sequence/align/buckets.py +12 -10
biotite/sequence/align/cigar.py +43 -52
biotite/sequence/align/kmeralphabet.cp311-win_amd64.pyd +0 -0
biotite/sequence/align/kmeralphabet.pyx +55 -51
biotite/sequence/align/kmersimilarity.cp311-win_amd64.pyd +0 -0
biotite/sequence/align/kmertable.cp311-win_amd64.pyd +0 -0
biotite/sequence/align/kmertable.pyx +3 -2
biotite/sequence/align/localgapped.cp311-win_amd64.pyd +0 -0
biotite/sequence/align/localungapped.cp311-win_amd64.pyd +0 -0
biotite/sequence/align/matrix.py +81 -82
biotite/sequence/align/multiple.cp311-win_amd64.pyd +0 -0
biotite/sequence/align/multiple.pyx +1 -1
biotite/sequence/align/pairwise.cp311-win_amd64.pyd +0 -0
biotite/sequence/align/permutation.cp311-win_amd64.pyd +0 -0
biotite/sequence/align/permutation.pyx +12 -4
biotite/sequence/align/selector.cp311-win_amd64.pyd +0 -0
biotite/sequence/align/selector.pyx +52 -54
biotite/sequence/align/statistics.py +32 -33
biotite/sequence/align/tracetable.cp311-win_amd64.pyd +0 -0
biotite/sequence/alphabet.py +51 -65
biotite/sequence/annotation.py +78 -77
biotite/sequence/codec.cp311-win_amd64.pyd +0 -0
biotite/sequence/codon.py +90 -79
biotite/sequence/graphics/__init__.py +1 -1
biotite/sequence/graphics/alignment.py +184 -103
biotite/sequence/graphics/colorschemes.py +10 -12
biotite/sequence/graphics/dendrogram.py +79 -34
biotite/sequence/graphics/features.py +133 -99
biotite/sequence/graphics/logo.py +22 -28
biotite/sequence/graphics/plasmid.py +229 -178
biotite/sequence/io/fasta/__init__.py +1 -1
biotite/sequence/io/fasta/convert.py +44 -33
biotite/sequence/io/fasta/file.py +42 -55
biotite/sequence/io/fastq/__init__.py +1 -1
biotite/sequence/io/fastq/convert.py +11 -14
biotite/sequence/io/fastq/file.py +68 -112
biotite/sequence/io/genbank/__init__.py +2 -2
biotite/sequence/io/genbank/annotation.py +12 -20
biotite/sequence/io/genbank/file.py +74 -76
biotite/sequence/io/genbank/metadata.py +74 -62
biotite/sequence/io/genbank/sequence.py +13 -14
biotite/sequence/io/general.py +39 -30
biotite/sequence/io/gff/__init__.py +2 -2
biotite/sequence/io/gff/convert.py +10 -15
biotite/sequence/io/gff/file.py +81 -65
biotite/sequence/phylo/__init__.py +1 -1
biotite/sequence/phylo/nj.cp311-win_amd64.pyd +0 -0
biotite/sequence/phylo/tree.cp311-win_amd64.pyd +0 -0
biotite/sequence/phylo/upgma.cp311-win_amd64.pyd +0 -0
biotite/sequence/profile.py +57 -28
biotite/sequence/search.py +17 -15
biotite/sequence/seqtypes.py +200 -164
biotite/sequence/sequence.py +15 -17
biotite/structure/__init__.py +3 -3
biotite/structure/atoms.py +246 -236
biotite/structure/basepairs.py +260 -271
biotite/structure/bonds.cp311-win_amd64.pyd +0 -0
biotite/structure/bonds.pyx +29 -32
biotite/structure/box.py +67 -71
biotite/structure/celllist.cp311-win_amd64.pyd +0 -0
biotite/structure/chains.py +55 -39
biotite/structure/charges.cp311-win_amd64.pyd +0 -0
biotite/structure/compare.py +32 -32
biotite/structure/density.py +13 -18
biotite/structure/dotbracket.py +20 -22
biotite/structure/error.py +10 -2
biotite/structure/filter.py +83 -78
biotite/structure/geometry.py +130 -119
biotite/structure/graphics/atoms.py +60 -43
biotite/structure/graphics/rna.py +81 -68
biotite/structure/hbond.py +112 -93
biotite/structure/info/__init__.py +0 -2
biotite/structure/info/atoms.py +10 -11
biotite/structure/info/bonds.py +41 -43
biotite/structure/info/ccd.py +4 -5
biotite/structure/info/groups.py +1 -3
biotite/structure/info/masses.py +5 -10
biotite/structure/info/misc.py +1 -1
biotite/structure/info/radii.py +20 -20
biotite/structure/info/standardize.py +15 -26
biotite/structure/integrity.py +18 -71
biotite/structure/io/__init__.py +3 -4
biotite/structure/io/dcd/__init__.py +1 -1
biotite/structure/io/dcd/file.py +22 -20
biotite/structure/io/general.py +47 -61
biotite/structure/io/gro/__init__.py +1 -1
biotite/structure/io/gro/file.py +73 -72
biotite/structure/io/mol/__init__.py +1 -1
biotite/structure/io/mol/convert.py +8 -11
biotite/structure/io/mol/ctab.py +37 -36
biotite/structure/io/mol/header.py +14 -10
biotite/structure/io/mol/mol.py +9 -53
biotite/structure/io/mol/sdf.py +47 -50
biotite/structure/io/netcdf/__init__.py +1 -1
biotite/structure/io/netcdf/file.py +24 -23
biotite/structure/io/pdb/__init__.py +1 -1
biotite/structure/io/pdb/convert.py +32 -20
biotite/structure/io/pdb/file.py +151 -172
biotite/structure/io/pdb/hybrid36.cp311-win_amd64.pyd +0 -0
biotite/structure/io/pdbqt/__init__.py +1 -1
biotite/structure/io/pdbqt/convert.py +17 -11
biotite/structure/io/pdbqt/file.py +128 -80
biotite/structure/io/pdbx/__init__.py +1 -2
biotite/structure/io/pdbx/bcif.py +36 -44
biotite/structure/io/pdbx/cif.py +140 -110
biotite/structure/io/pdbx/component.py +10 -16
biotite/structure/io/pdbx/convert.py +260 -258
biotite/structure/io/pdbx/encoding.cp311-win_amd64.pyd +0 -0
biotite/structure/io/trajfile.py +90 -107
biotite/structure/io/trr/__init__.py +1 -1
biotite/structure/io/trr/file.py +12 -15
biotite/structure/io/xtc/__init__.py +1 -1
biotite/structure/io/xtc/file.py +11 -14
biotite/structure/mechanics.py +9 -11
biotite/structure/molecules.py +3 -4
biotite/structure/pseudoknots.py +53 -67
biotite/structure/rdf.py +23 -21
biotite/structure/repair.py +137 -86
biotite/structure/residues.py +26 -16
biotite/structure/sasa.cp311-win_amd64.pyd +0 -0
biotite/structure/{resutil.py → segments.py} +24 -23
biotite/structure/sequence.py +10 -11
biotite/structure/sse.py +100 -119
biotite/structure/superimpose.py +39 -77
biotite/structure/transform.py +97 -71
biotite/structure/util.py +11 -13
biotite/version.py +2 -2
biotite/visualize.py +69 -55
{biotite-0.41.2.dist-info → biotite-1.0.1.dist-info}/METADATA +6 -5
biotite-1.0.1.dist-info/RECORD +322 -0
biotite/structure/io/ctab.py +0 -72
biotite/structure/io/mmtf/__init__.py +0 -21
biotite/structure/io/mmtf/assembly.py +0 -214
biotite/structure/io/mmtf/convertarray.cp311-win_amd64.pyd +0 -0
biotite/structure/io/mmtf/convertarray.pyx +0 -341
biotite/structure/io/mmtf/convertfile.cp311-win_amd64.pyd +0 -0
biotite/structure/io/mmtf/convertfile.pyx +0 -501
biotite/structure/io/mmtf/decode.cp311-win_amd64.pyd +0 -0
biotite/structure/io/mmtf/decode.pyx +0 -152
biotite/structure/io/mmtf/encode.cp311-win_amd64.pyd +0 -0
biotite/structure/io/mmtf/encode.pyx +0 -183
biotite/structure/io/mmtf/file.py +0 -233
biotite/structure/io/npz/__init__.py +0 -20
biotite/structure/io/npz/file.py +0 -152
biotite/structure/io/pdbx/legacy.py +0 -267
biotite/structure/io/tng/__init__.py +0 -13
biotite/structure/io/tng/file.py +0 -46
biotite/temp.py +0 -86
biotite-0.41.2.dist-info/RECORD +0 -340
{biotite-0.41.2.dist-info → biotite-1.0.1.dist-info}/WHEEL +0 -0
{biotite-0.41.2.dist-info → biotite-1.0.1.dist-info}/licenses/LICENSE.rst +0 -0

biotite/sequence/io/genbank/sequence.py CHANGED Viewed

@@ -8,16 +8,19 @@ Functions for converting a sequence from/to a GenBank file.
 __name__ = "biotite.sequence.io.genbank"
 __author__ = "Patrick Kunzmann"
-__all__ = ["get_raw_sequence", "get_sequence", "get_annotated_sequence",
-           "set_sequence", "set_annotated_sequence"]
+__all__ = [
+    "get_raw_sequence",
+    "get_sequence",
+    "get_annotated_sequence",
+    "set_sequence",
+    "set_annotated_sequence",
+]
 import re
-from ....file import InvalidFileError
-from ...seqtypes import ProteinSequence, NucleotideSequence
-from ...annotation import AnnotatedSequence
-from .file import GenBankFile
-from .annotation import get_annotation, set_annotation
+from biotite.file import InvalidFileError
+from biotite.sequence.annotation import AnnotatedSequence
+from biotite.sequence.io.genbank.annotation import get_annotation, set_annotation
+from biotite.sequence.seqtypes import NucleotideSequence, ProteinSequence
 _SYMBOLS_PER_CHUNK = 10
 _SEQ_CHUNKS_PER_LINE = 6
@@ -112,7 +115,7 @@ def _convert_seq_str(seq_str, format):
     if len(seq_str) == 0:
         raise InvalidFileError("The file's 'ORIGIN' field is empty")
     if format == "gb":
-        return NucleotideSequence(seq_str.replace("U","T").replace("X","N"))
+        return NucleotideSequence(seq_str.replace("U", "T").replace("X", "N"))
     elif format == "gp":
         return ProteinSequence(seq_str.replace("U", "C").replace("O", "K"))
     else:
@@ -125,8 +128,6 @@ def _get_seq_start(origin_content):
     return int(origin_content[0].split()[0])
 def set_sequence(gb_file, sequence, sequence_start=1):
     """
     Set the *ORIGIN* field of a GenBank file with a sequence.
@@ -167,6 +168,4 @@ def set_annotated_sequence(gb_file, annot_sequence):
         The annotated sequence that is put into the GenBank file.
     """
     set_annotation(gb_file, annot_sequence.annotation)
-    set_sequence(
-        gb_file, annot_sequence.sequence, annot_sequence.sequence_start
-    )
+    set_sequence(gb_file, annot_sequence.sequence, annot_sequence.sequence_start)

biotite/sequence/io/general.py CHANGED Viewed

@@ -9,31 +9,27 @@ general sequence files.
 __name__ = "biotite.sequence.io"
 __author__ = "Patrick Kunzmann"
-__all__ = ["load_sequence", "save_sequence",
-           "load_sequences", "save_sequences"]
+__all__ = ["load_sequence", "save_sequence", "load_sequences", "save_sequences"]
-import itertools
 import os.path
-import io
 from collections import OrderedDict
 import numpy as np
-from ..seqtypes import NucleotideSequence, ProteinSequence
-from ..alphabet import Alphabet
+from biotite.sequence.seqtypes import NucleotideSequence
 def load_sequence(file_path):
     """
     Load a sequence from a sequence file without the need
     to manually instantiate a :class:`File` object.
     Internally this function uses a :class:`File` object, based on the
     file extension.
     Parameters
     ----------
     file_path : str
         The path to the sequence file.
     Returns
     -------
     sequence : Sequence
@@ -42,11 +38,13 @@ def load_sequence(file_path):
     # We only need the suffix here
     filename, suffix = os.path.splitext(file_path)
     if suffix in [".fasta", ".fa", ".mpfa", ".fna", ".fsa"]:
-        from .fasta import FastaFile, get_sequence
+        from biotite.sequence.io.fasta import FastaFile, get_sequence
         file = FastaFile.read(file_path)
         return get_sequence(file)
     elif suffix in [".fastq", ".fq"]:
-        from .fastq import FastqFile
+        from biotite.sequence.io.fastq import FastqFile
         # Quality scores are irrelevant for this function
         # -> Offset is irrelevant
         file = FastqFile.read(file_path, offset="Sanger")
@@ -56,7 +54,8 @@ def load_sequence(file_path):
             break
         return sequence
     elif suffix in [".gb", ".gbk", ".gp"]:
-        from .genbank import GenBankFile, get_sequence
+        from biotite.sequence.io.genbank import GenBankFile, get_sequence
         format = "gp" if suffix == ".gp" else "gb"
         file = GenBankFile.read(file_path)
         return get_sequence(file, format)
@@ -68,10 +67,10 @@ def save_sequence(file_path, sequence):
     """
     Save a sequence into a sequence file without the need
     to manually instantiate a :class:`File` object.
     Internally this function uses a :class:`File` object, based on the
     given file extension.
     Parameters
     ----------
     file_path : str
@@ -82,12 +81,14 @@ def save_sequence(file_path, sequence):
     # We only need the suffix here
     filename, suffix = os.path.splitext(file_path)
     if suffix in [".fasta", ".fa", ".mpfa", ".fna", ".fsa"]:
-        from .fasta import FastaFile, set_sequence
+        from biotite.sequence.io.fasta import FastaFile, set_sequence
         file = FastaFile()
         set_sequence(file, sequence)
         file.write(file_path)
     elif suffix in [".fastq", ".fq"]:
-        from .fastq import FastqFile
+        from biotite.sequence.io.fastq import FastqFile
         # Quality scores are irrelevant for this function
         # -> Offset is irrelevant
         file = FastqFile(offset="Sanger")
@@ -96,7 +97,8 @@ def save_sequence(file_path, sequence):
         file["sequence"] = str(sequence), scores
         file.write(file_path)
     elif suffix in [".gb", ".gbk", ".gp"]:
-        from .genbank import GenBankFile, set_locus, set_sequence
+        from biotite.sequence.io.genbank import GenBankFile, set_locus, set_sequence
         file = GenBankFile()
         set_locus(file, "sequence", len(sequence))
         set_sequence(file, sequence)
@@ -109,37 +111,42 @@ def load_sequences(file_path):
     """
     Load multiple sequences from a sequence file without the need
     to manually instantiate a :class:`File` object.
     Internally this function uses a :class:`File` object, based on the
     file extension.
     Parameters
     ----------
     file_path : str
         The path to the sequence file.
     Returns
     -------
     sequences : dict of (str, Sequence)
         The sequences in the file.
         This dictionary maps each header name to
-        the respective sequence.
+        the respective sequence.
     """
     # We only need the suffix here
     filename, suffix = os.path.splitext(file_path)
     if suffix in [".fasta", ".fa", ".mpfa", ".fna", ".fsa"]:
-        from .fasta import FastaFile, get_sequences
+        from biotite.sequence.io.fasta import FastaFile, get_sequences
         file = FastaFile.read(file_path)
         return get_sequences(file)
     elif suffix in [".fastq", ".fq"]:
-        from .fastq import FastqFile
+        from biotite.sequence.io.fastq import FastqFile
         # Quality scores are irrelevant for this function
         # -> Offset is irrelevant
         file = FastqFile.read(file_path, offset="Sanger")
-        return {identifier : NucleotideSequence(seq_str)
-                for identifier, (seq_str, scores) in file.items()}
+        return {
+            identifier: NucleotideSequence(seq_str)
+            for identifier, (seq_str, scores) in file.items()
+        }
     elif suffix in [".gb", ".gbk", ".gp"]:
-        from .genbank import MultiFile, get_definition, get_sequence
+        from biotite.sequence.io.genbank import MultiFile, get_definition, get_sequence
         file = MultiFile.read(file_path)
         format = "gp" if suffix == ".gp" else "gb"
         sequences = OrderedDict()
@@ -154,10 +161,10 @@ def save_sequences(file_path, sequences):
     """
     Save multiple sequences into a sequence file without the need
     to manually instantiate a :class:`File` object.
     Internally this function uses a :class:`File` object, based on the
     given file extension.
     Parameters
     ----------
     file_path : str
@@ -169,12 +176,14 @@ def save_sequences(file_path, sequences):
     # We only need the suffix here
     filename, suffix = os.path.splitext(file_path)
     if suffix in [".fasta", ".fa", ".mpfa", ".fna", ".fsa"]:
-        from .fasta import FastaFile, set_sequences
+        from biotite.sequence.io.fasta import FastaFile, set_sequences
         file = FastaFile()
         set_sequences(file, sequences)
         file.write(file_path)
     elif suffix in [".fastq", ".fq"]:
-        from .fastq import FastqFile
+        from biotite.sequence.io.fastq import FastqFile
         # Quality scores are irrelevant for this function
         # -> Offset is irrelevant
         file = FastqFile(offset="Sanger")

biotite/sequence/io/gff/__init__.py CHANGED Viewed

@@ -14,7 +14,7 @@ interface to this format, and high-level functions for extracting
    GFF 3 files. This means, that you cannot directly access the
    parent or child of a feature.
    However, the ``Id`` and ``Name`` attributes are stored in the
-   qualifiers of the created :class:`Feature` objects.
+   qualifiers of the created :class:`Feature` objects.
    Hence, it is possible to implement such a data structure from this
    information.
 """
@@ -22,5 +22,5 @@ interface to this format, and high-level functions for extracting
 __name__ = "biotite.sequence.io.gff"
 __author__ = "Patrick Kunzmann"
+from .convert import *
 from .file import *
-from .convert import *

biotite/sequence/io/gff/convert.py CHANGED Viewed

@@ -6,7 +6,7 @@ __name__ = "biotite.sequence.io.gff"
 __author__ = "Patrick Kunzmann"
 __all__ = ["get_annotation", "set_annotation"]
-from ...annotation import Location, Feature, Annotation
+from biotite.sequence.annotation import Annotation, Feature, Location
 def get_annotation(gff_file):
@@ -22,12 +22,12 @@ def get_annotation(gff_file):
     Thus, for entries with the same ``ID``, the *type* and *attributes*
     are only parsed once and the locations are aggregated from each
     entry.
     Parameters
     ----------
     gff_file : GFFFile
         The file to extract the :class:`Annotation` object from.
     Returns
     -------
     annotation : Annotation
@@ -45,9 +45,7 @@ def get_annotation(gff_file):
             # (beginning of the file)
             if current_key is not None:
                 # Beginning of new feature -> Save previous feature
-                annot.add_feature(
-                    Feature(current_key, current_locs, current_qual)
-                )
+                annot.add_feature(Feature(current_key, current_locs, current_qual))
             # Track new feature
             current_key = type
             current_locs = [Location(start, end, strand)]
@@ -61,15 +59,14 @@ def get_annotation(gff_file):
     return annot
-def set_annotation(gff_file, annotation,
-                   seqid=None, source=None, is_stranded=True):
+def set_annotation(gff_file, annotation, seqid=None, source=None, is_stranded=True):
     """
     Write an :class:`Annotation` object into a GFF3 file.
     Each feature will get one entry for each location it has.
     :class:`Feature` objects with multiple locations require the ``ID``
     qualifier in its :attr:`Feature.qual` attribute.
     Parameters
     ----------
     gff_file : GFFFile
@@ -87,14 +84,13 @@ def set_annotation(gff_file, annotation,
     for feature in sorted(annotation):
         if len(feature.locs) > 1 and "ID" not in feature.qual:
             raise ValueError(
-                "The 'Id' qualifier is required "
-                "for features with multiple locations"
+                "The 'Id' qualifier is required " "for features with multiple locations"
             )
         ## seqid ##
         if seqid is not None and " " in seqid:
             raise ValueError("The 'seqid' must not contain whitespaces")
         ## source ##
-        #Nothing to be done
+        # Nothing to be done
         ## type ##
         type = feature.key
         ## strand ##
@@ -128,6 +124,5 @@ def set_annotation(gff_file, annotation,
             else:
                 phase = None
             gff_file.append(
-                seqid, source, type, start, end,
-                score, strand, phase, attributes
-            )
+                seqid, source, type, start, end, score, strand, phase, attributes
+            )

biotite/sequence/io/gff/file.py CHANGED Viewed

@@ -6,19 +6,17 @@ __name__ = "biotite.sequence.io.gff"
 __author__ = "Patrick Kunzmann"
 __all__ = ["GFFFile"]
-import copy
 import string
-from urllib.parse import quote, unquote
 import warnings
-from ....file import TextFile, InvalidFileError
-from ...annotation import Location
+from urllib.parse import quote, unquote
+from biotite.file import InvalidFileError, TextFile
+from biotite.sequence.annotation import Location
 # All punctuation characters except
 # percent, semicolon, equals, ampersand, comma
-_NOT_QUOTED = "".join(
-    [char for char in string.punctuation if char not in "%;=&,"]
-) + " "
+_NOT_QUOTED = (
+    "".join([char for char in string.punctuation if char not in "%;=&,"]) + " "
+)
 class GFFFile(TextFile):
@@ -61,7 +59,7 @@ class GFFFile(TextFile):
     The content after the ``##FASTA`` directive is simply ignored.
     Please provide the sequence via a separate file or read the FASTA
     data directly via the :attr:`lines` attribute:
     >>> import os.path
     >>> from io import StringIO
     >>> gff_file = GFFFile.read(os.path.join(path_to_sequences, "indexing_test.gff3"))
@@ -121,7 +119,7 @@ class GFFFile(TextFile):
     ##Example directive param1 param2
     SomeSeqID   Biotite CDS     1       99      .       +       0       ID=FeatureID;product=A protein
     """
     def __init__(self):
         super().__init__()
         # Maps entry indices to line indices
@@ -132,18 +130,18 @@ class GFFFile(TextFile):
         self._has_fasta = None
         self._index_entries()
         self.append_directive("gff-version", "3")
     @classmethod
     def read(cls, file):
         """
         Read a GFF3 file.
         Parameters
         ----------
         file : file-like object or str
             The file to be read.
             Alternatively a file path can be supplied.
         Returns
         -------
         file_object : GFFFile
@@ -152,18 +150,29 @@ class GFFFile(TextFile):
         file = super().read(file)
         file._index_entries()
         return file
-    def insert(self, index, seqid, source, type, start, end,
-               score, strand, phase, attributes=None):
+    def insert(
+        self,
+        index,
+        seqid,
+        source,
+        type,
+        start,
+        end,
+        score,
+        strand,
+        phase,
+        attributes=None,
+    ):
         """
         Insert an entry at the given index.
         Parameters
         ----------
         index : int
             Index where the entry is inserted.
             If the index is equal to the length of the file, the entry
-            is appended at the end of the file.
+            is appended at the end of the file.
         seqid : str
             The ID of the reference sequence.
         source : str
@@ -184,22 +193,23 @@ class GFFFile(TextFile):
             Additional properties of the feature.
         """
         if index == len(self):
-            self.append(seqid, source, type, start, end,
-                        score, strand, phase, attributes)
+            self.append(
+                seqid, source, type, start, end, score, strand, phase, attributes
+            )
         else:
             line_index = self._entries[index]
             line = GFFFile._create_line(
-                seqid, source, type, start, end,
-                score, strand, phase, attributes
+                seqid, source, type, start, end, score, strand, phase, attributes
             )
             self.lines.insert(line_index, line)
             self._index_entries()
-    def append(self, seqid, source, type, start, end,
-               score, strand, phase, attributes=None):
+    def append(
+        self, seqid, source, type, start, end, score, strand, phase, attributes=None
+    ):
         """
         Append an entry to the end of the file.
         Parameters
         ----------
         seqid : str
@@ -232,11 +242,11 @@ class GFFFile(TextFile):
         self.lines.append(line)
         # Fast update of entry index by adding last line
         self._entries.append(len(self.lines) - 1)
     def append_directive(self, directive, *args):
         """
         Append a directive line to the end of the file.
         Parameters
         ----------
         directive : str
@@ -245,13 +255,13 @@ class GFFFile(TextFile):
             Optional parameters for the directive.
             Each argument is simply appended to the directive, separated
             by a single space character.
         Raises
         ------
         NotImplementedError
             If the ``##FASTA`` directive is used, which is not
             supported.
         Examples
         --------
@@ -262,17 +272,15 @@ class GFFFile(TextFile):
         ##Example directive param1 param2
         """
         if directive.startswith("FASTA"):
-            raise NotImplementedError(
-                "Adding FASTA information is not supported"
-            )
+            raise NotImplementedError("Adding FASTA information is not supported")
         directive_line = "##" + directive + " " + " ".join(args)
         self._directives.append((directive_line[2:], len(self.lines)))
         self.lines.append(directive_line)
     def directives(self):
         """
         Get the directives in the file.
         Returns
         -------
         directives : list of tuple(str, int)
@@ -283,7 +291,7 @@ class GFFFile(TextFile):
         """
         # Sort in line order
         return sorted(self._directives, key=lambda directive: directive[1])
     def __setitem__(self, index, item):
         seqid, source, type, start, end, score, strand, phase, attrib = item
         line = GFFFile._create_line(
@@ -292,15 +300,13 @@ class GFFFile(TextFile):
         line_index = self._entries[index]
         self.lines[line_index] = line
     def __getitem__(self, index):
-        if (index >= 0 and  index >= len(self)) or \
-           (index <  0 and -index >  len(self)):
-                raise IndexError(
-                    f"Index {index} is out of range for GFFFile with "
-                    f"{len(self)} entries"
-                )
+        if (index >= 0 and index >= len(self)) or (index < 0 and -index > len(self)):
+            raise IndexError(
+                f"Index {index} is out of range for GFFFile with "
+                f"{len(self)} entries"
+            )
         line_index = self._entries[index]
         # Columns are tab separated
         s = self.lines[line_index].strip().split("\t")
@@ -324,15 +330,15 @@ class GFFFile(TextFile):
         attrib = GFFFile._parse_attributes(attrib)
         return seqid, source, type, start, end, score, strand, phase, attrib
     def __delitem__(self, index):
         line_index = self._entries[index]
         del self.lines[line_index]
         self._index_entries()
     def __len__(self):
         return len(self._entries)
     def _index_entries(self):
         """
         Parse the file for comment and directive lines.
@@ -374,15 +380,12 @@ class GFFFile(TextFile):
         self._entries = self._entries[:entry_counter]
     @staticmethod
-    def _create_line(seqid, source, type, start, end,
-                     score, strand, phase, attributes):
+    def _create_line(seqid, source, type, start, end, score, strand, phase, attributes):
         """
         Create a line for a newly created entry.
         """
-        seqid = quote(seqid.strip(), safe=_NOT_QUOTED) \
-                if seqid is not None else "."
-        source = quote(source.strip(), safe=_NOT_QUOTED) \
-                 if source is not None else "."
+        seqid = quote(seqid.strip(), safe=_NOT_QUOTED) if seqid is not None else "."
+        source = quote(source.strip(), safe=_NOT_QUOTED) if source is not None else "."
         type = type.strip()
         # Perform checks
@@ -394,7 +397,7 @@ class GFFFile(TextFile):
             raise ValueError("'type' must not be empty")
         if seqid[0] == ">":
             raise ValueError("'seqid' must not start with '>'")
         score = str(score) if score is not None else "."
         if strand == Location.Strand.FORWARD:
             strand = "+"
@@ -403,16 +406,31 @@ class GFFFile(TextFile):
         else:
             strand = "."
         phase = str(phase) if phase is not None else "."
-        attributes = ";".join(
-            [quote(key, safe=_NOT_QUOTED) + "=" + quote(val, safe=_NOT_QUOTED)
-             for key, val in attributes.items()]
-        ) if attributes is not None and len(attributes) > 0 else "."
+        attributes = (
+            ";".join(
+                [
+                    quote(key, safe=_NOT_QUOTED) + "=" + quote(val, safe=_NOT_QUOTED)
+                    for key, val in attributes.items()
+                ]
+            )
+            if attributes is not None and len(attributes) > 0
+            else "."
+        )
         return "\t".join(
-            [seqid, source, type, str(start), str(end),
-             str(score), strand, phase, attributes]
+            [
+                seqid,
+                source,
+                type,
+                str(start),
+                str(end),
+                str(score),
+                strand,
+                phase,
+                attributes,
+            ]
         )
     @staticmethod
     def _parse_attributes(attributes):
         """
@@ -426,9 +444,7 @@ class GFFFile(TextFile):
         for entry in attrib_entries:
             compounds = entry.split("=")
             if len(compounds) != 2:
-                raise InvalidFileError(
-                    f"Attribute entry '{entry}' is invalid"
-                )
+                raise InvalidFileError(f"Attribute entry '{entry}' is invalid")
             key, val = compounds
             attrib_dict[unquote(key)] = unquote(val)
-        return attrib_dict
+        return attrib_dict

biotite/sequence/phylo/__init__.py CHANGED Viewed

@@ -31,6 +31,6 @@ popular *UPGMA* (:func:`upgma()`) and *Neighbor-Joining*
 __name__ = "biotite.sequence.phylo"
 __author__ = "Patrick Kunzmann"
+from .nj import *
 from .tree import *
 from .upgma import *
-from .nj import *

biotite/sequence/phylo/nj.cp311-win_amd64.pyd CHANGED Viewed

Binary file

biotite/sequence/phylo/tree.cp311-win_amd64.pyd CHANGED Viewed

Binary file

biotite/sequence/phylo/upgma.cp311-win_amd64.pyd CHANGED Viewed

Binary file