PyPI - biotite - Versions diffs - 0.38.0__cp311-cp311-macosx_11_0_arm64.whl → 0.40.0__cp311-cp311-macosx_11_0_arm64.whl - Mend

biotite 0.38.0__cp311-cp311-macosx_11_0_arm64.whl → 0.40.0__cp311-cp311-macosx_11_0_arm64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of biotite might be problematic. Click here for more details.

Files changed (124) hide show

biotite/__init__.py +3 -3
biotite/application/application.py +33 -28
biotite/application/dssp/app.py +18 -18
biotite/application/sra/__init__.py +5 -0
biotite/application/sra/app.py +337 -55
biotite/database/entrez/__init__.py +2 -1
biotite/database/entrez/check.py +14 -3
biotite/database/entrez/download.py +20 -13
biotite/database/entrez/key.py +44 -0
biotite/database/entrez/query.py +38 -34
biotite/database/pubchem/query.py +44 -44
biotite/database/rcsb/download.py +19 -14
biotite/database/rcsb/query.py +46 -46
biotite/sequence/align/__init__.py +5 -1
biotite/sequence/align/banded.c +1408 -1025
biotite/sequence/align/banded.cpython-311-darwin.so +0 -0
biotite/sequence/align/buckets.py +69 -0
biotite/sequence/align/cigar.py +389 -0
biotite/sequence/align/kmeralphabet.c +3220 -2850
biotite/sequence/align/kmeralphabet.cpython-311-darwin.so +0 -0
biotite/sequence/align/kmersimilarity.c +713 -663
biotite/sequence/align/kmersimilarity.cpython-311-darwin.so +0 -0
biotite/sequence/align/kmertable.cpp +68398 -0
biotite/sequence/align/kmertable.cpython-311-darwin.so +0 -0
biotite/sequence/align/localgapped.c +1507 -1074
biotite/sequence/align/localgapped.cpython-311-darwin.so +0 -0
biotite/sequence/align/localungapped.c +1143 -833
biotite/sequence/align/localungapped.cpython-311-darwin.so +0 -0
biotite/sequence/align/multiple.c +1569 -1092
biotite/sequence/align/multiple.cpython-311-darwin.so +0 -0
biotite/sequence/align/pairwise.c +1612 -1212
biotite/sequence/align/pairwise.cpython-311-darwin.so +0 -0
biotite/sequence/align/permutation.c +33259 -0
biotite/sequence/align/permutation.cpython-311-darwin.so +0 -0
biotite/sequence/align/primes.txt +821 -0
biotite/sequence/align/{kmertable.c → selector.c} +9129 -16497
biotite/sequence/align/selector.cpython-311-darwin.so +0 -0
biotite/sequence/align/tracetable.c +685 -646
biotite/sequence/align/tracetable.cpython-311-darwin.so +0 -0
biotite/sequence/codec.c +1159 -841
biotite/sequence/codec.cpython-311-darwin.so +0 -0
biotite/sequence/graphics/alignment.py +212 -2
biotite/sequence/io/genbank/annotation.py +11 -11
biotite/sequence/phylo/nj.c +684 -636
biotite/sequence/phylo/nj.cpython-311-darwin.so +0 -0
biotite/sequence/phylo/tree.c +970 -673
biotite/sequence/phylo/tree.cpython-311-darwin.so +0 -0
biotite/sequence/phylo/upgma.c +672 -626
biotite/sequence/phylo/upgma.cpython-311-darwin.so +0 -0
biotite/structure/__init__.py +1 -1
biotite/structure/atoms.py +1 -1
biotite/structure/basepairs.py +7 -12
biotite/structure/bonds.c +3861 -3749
biotite/structure/bonds.cpython-311-darwin.so +0 -0
biotite/structure/celllist.c +727 -707
biotite/structure/celllist.cpython-311-darwin.so +0 -0
biotite/structure/charges.c +1561 -1560
biotite/structure/charges.cpython-311-darwin.so +0 -0
biotite/structure/filter.py +30 -37
biotite/structure/info/__init__.py +5 -8
biotite/structure/info/atoms.py +25 -67
biotite/structure/info/bonds.py +46 -100
biotite/structure/info/ccd/README.rst +8 -0
biotite/structure/info/ccd/amino_acids.txt +1646 -0
biotite/structure/info/ccd/carbohydrates.txt +1133 -0
biotite/structure/info/ccd/components.bcif +0 -0
biotite/structure/info/ccd/nucleotides.txt +797 -0
biotite/structure/info/ccd.py +95 -0
biotite/structure/info/groups.py +90 -0
biotite/structure/info/masses.py +21 -20
biotite/structure/info/misc.py +11 -22
biotite/structure/info/standardize.py +17 -12
biotite/structure/io/__init__.py +2 -4
biotite/structure/io/ctab.py +1 -1
biotite/structure/io/general.py +37 -43
biotite/structure/io/mmtf/__init__.py +3 -0
biotite/structure/io/mmtf/convertarray.c +528 -365
biotite/structure/io/mmtf/convertarray.cpython-311-darwin.so +0 -0
biotite/structure/io/mmtf/convertfile.c +725 -676
biotite/structure/io/mmtf/convertfile.cpython-311-darwin.so +0 -0
biotite/structure/io/mmtf/decode.c +1070 -754
biotite/structure/io/mmtf/decode.cpython-311-darwin.so +0 -0
biotite/structure/io/mmtf/encode.c +727 -677
biotite/structure/io/mmtf/encode.cpython-311-darwin.so +0 -0
biotite/structure/io/mmtf/file.py +34 -26
biotite/structure/io/npz/__init__.py +3 -0
biotite/structure/io/npz/file.py +21 -18
biotite/structure/io/pdb/__init__.py +3 -3
biotite/structure/io/pdb/file.py +72 -70
biotite/structure/io/pdb/hybrid36.c +540 -478
biotite/structure/io/pdb/hybrid36.cpython-311-darwin.so +0 -0
biotite/structure/io/pdbqt/file.py +82 -68
biotite/structure/io/pdbx/__init__.py +13 -6
biotite/structure/io/pdbx/bcif.py +649 -0
biotite/structure/io/pdbx/cif.py +1028 -0
biotite/structure/io/pdbx/component.py +243 -0
biotite/structure/io/pdbx/convert.py +707 -359
biotite/structure/io/pdbx/encoding.c +112813 -0
biotite/structure/io/pdbx/encoding.cpython-311-darwin.so +0 -0
biotite/structure/io/pdbx/error.py +14 -0
biotite/structure/io/pdbx/legacy.py +267 -0
biotite/structure/molecules.py +151 -151
biotite/structure/residues.py +40 -40
biotite/structure/sasa.c +713 -644
biotite/structure/sasa.cpython-311-darwin.so +0 -0
biotite/structure/superimpose.py +158 -115
biotite/visualize.py +9 -11
{biotite-0.38.0.dist-info → biotite-0.40.0.dist-info}/METADATA +2 -2
{biotite-0.38.0.dist-info → biotite-0.40.0.dist-info}/RECORD +112 -102
{biotite-0.38.0.dist-info → biotite-0.40.0.dist-info}/WHEEL +1 -1
biotite/structure/info/amino_acids.json +0 -1556
biotite/structure/info/amino_acids.py +0 -42
biotite/structure/info/carbohydrates.json +0 -1122
biotite/structure/info/carbohydrates.py +0 -39
biotite/structure/info/intra_bonds.msgpack +0 -0
biotite/structure/info/link_types.msgpack +0 -1
biotite/structure/info/nucleotides.json +0 -772
biotite/structure/info/nucleotides.py +0 -39
biotite/structure/info/residue_masses.msgpack +0 -0
biotite/structure/info/residue_names.msgpack +0 -3
biotite/structure/info/residues.msgpack +0 -0
biotite/structure/io/pdbx/file.py +0 -652
{biotite-0.38.0.dist-info → biotite-0.40.0.dist-info}/LICENSE.rst +0 -0
{biotite-0.38.0.dist-info → biotite-0.40.0.dist-info}/top_level.txt +0 -0

biotite/database/rcsb/query.py CHANGED Viewed

@@ -32,7 +32,7 @@ _scope_to_target = {
 class Query(metaclass=abc.ABCMeta):
     """
     A representation of a JSON query for the RCSB search API.
     This is the abstract base class for all queries.
     """
     @abc.abstractmethod
@@ -62,7 +62,7 @@ class Query(metaclass=abc.ABCMeta):
 class SingleQuery(Query, metaclass=abc.ABCMeta):
     """
     A terminal query node for the RCSB search API.
     Multiple :class:`SingleQuery` objects can be combined to
     :class:`CompositeQuery` objects using the ``|`` and ``&`` operators.
@@ -77,7 +77,7 @@ class SingleQuery(Query, metaclass=abc.ABCMeta):
 class CompositeQuery(Query):
     """
     A group query node for the RCSB search API.
     A composite query is a combination of other queries, combined
     either with the `'and'` or `'or'` operator.
     Usually, a :class:`CompositeQuery` will not be created by calling
@@ -98,11 +98,11 @@ class CompositeQuery(Query):
                 f"Operator must be 'or' or 'and', not '{operator}'"
             )
         self._operator = operator
     def get_content(self):
         """
         A dictionary representation of the query.
-        This dictionary is the content of the ``'query'`` key in the
+        This dictionary is the content of the ``'query'`` key in the
         JSON query.
         Returns
@@ -133,13 +133,13 @@ class BasicQuery(SingleQuery):
         The matching is not case-sensitive.
         Logic combinations of terms are described
         `here <https://search.rcsb.org/#basic-queries>`_.
     Examples
     --------
     >>> query = BasicQuery("tc5b")
-    >>> print(search(query))
-    ['1L2Y', '8ANM', '8ANH', '8ANG', '8ANI']
+    >>> print(sorted(search(query)))
+    ['1L2Y', '8ANG', '8ANH', '8ANI', '8ANM']
     """
     def __init__(self, term):
         super().__init__()
@@ -207,7 +207,7 @@ class FieldQuery(SingleQuery):
     Examples
     --------
     >>> query = FieldQuery("reflns.d_resolution_high", less_or_equal=0.6)
     >>> print(sorted(search(query)))
     ['1EJG', '1I0T', '3NIR', '3P4J', '4JLJ', '5D8V', '5NW3', '7ATG', '7R0H']
@@ -218,7 +218,7 @@ class FieldQuery(SingleQuery):
         self._field = field
         self._mol_definition = molecular_definition
         self._case_sensitive = case_sensitive
         if len(kwargs) > 1:
             raise TypeError("Only one operator must be given")
         elif len(kwargs) == 1:
@@ -228,7 +228,7 @@ class FieldQuery(SingleQuery):
             # No operator is given
             self._operator = "exists"
             self._value = None
         if self._operator not in [
             "exact_match",
             "contains_words", "contains_phrase",
@@ -241,7 +241,7 @@ class FieldQuery(SingleQuery):
                 f"Constructor got an unexpected keyword argument "
                 f"'{self._operator}'"
             )
         # Convert dates into ISO 8601
         if isinstance(self._value, datetime):
              self._value = _to_isoformat(self._value)
@@ -250,7 +250,7 @@ class FieldQuery(SingleQuery):
                 _to_isoformat(val) if isinstance(val, datetime) else val
                 for val in self._value
             ]
         # Create dictionary for 'range' operator
         if self._operator == "range":
             self._value = {
@@ -266,7 +266,7 @@ class FieldQuery(SingleQuery):
                 "to": self._value[1],
                 "include_upper": True
             }
         # Rename operators to names used in API
         if self._operator == "is_in":
             # 'in' is not an available parameter name in Python
@@ -326,7 +326,7 @@ class SequenceQuery(SingleQuery):
     Examples
     --------
     >>> sequence = "NLYIQWLKDGGPSSGRPPPS"
     >>> query = SequenceQuery(sequence, scope="protein", min_identity=0.8)
     >>> print(sorted(search(query)))
@@ -338,12 +338,12 @@ class SequenceQuery(SingleQuery):
         self._target = _scope_to_target.get(scope.lower())
         if self._target is None:
             raise ValueError(f"'{scope}' is an invalid scope")
         if isinstance(sequence, NucleotideSequence) and scope.lower() == "rna":
             self._sequence = str(sequence).replace("T", "U")
         else:
             self._sequence = str(sequence)
         self._min_identity = min_identity
         self._max_expect_value = max_expect_value
@@ -371,10 +371,10 @@ class MotifQuery(SingleQuery):
         The type of the pattern.
     scope : {'protein', 'dna', 'rna'}
         The type of molecule to find.
     Examples
     --------
     >>> query = MotifQuery(
     ...     "C-x(2,4)-C-x(3)-[LIVMFYWC]-x(8)-H-x(3,5)-H.",
     ...     "prosite",
@@ -416,7 +416,7 @@ class StructureQuery(SingleQuery):
     strict : bool, optional
         If true, structure comparison is strict, otherwise it is
         relaxed.
     Examples
     --------
@@ -442,7 +442,7 @@ class StructureQuery(SingleQuery):
                 "entry_id": pdb_id,
                 "asym_id": chain
             }
         self._operator = "strict_shape_match" if strict \
                          else "relaxed_shape_match"
@@ -462,7 +462,7 @@ class Sorting:
     def __init__(self, field, descending=True):
         self._field = field
         self._descending = descending
     @property
     def field(self):
         return self._field
@@ -470,7 +470,7 @@ class Sorting:
     @property
     def descending(self):
         return self._descending
     def get_content(self):
         """
         Get the sorting content, i.e. the data belonging to the
@@ -497,7 +497,7 @@ class Sorting:
 class Grouping(metaclass=abc.ABCMeta):
     """
-    A representation of the JSON grouping options of the RCSB search
+    A representation of the JSON grouping options of the RCSB search
     API.
     Parameters
@@ -521,7 +521,7 @@ class Grouping(metaclass=abc.ABCMeta):
             self._sorting = sort_by
         else:
             self._sorting = Sorting(sort_by)
     @abc.abstractmethod
     def get_content(self):
         """
@@ -542,7 +542,7 @@ class Grouping(metaclass=abc.ABCMeta):
             return {"ranking_criteria_type" : self._sorting.get_content()}
         else:
             return {}
     @abc.abstractmethod
     def is_compatible_return_type(self, return_type):
         """
@@ -555,7 +555,7 @@ class Grouping(metaclass=abc.ABCMeta):
         ----------
         return_type : str
             The ``return_type`` attribute to be checked.
         Returns
         -------
         is_compatible : bool
@@ -593,7 +593,7 @@ class DepositGrouping(Grouping):
         content = super().get_content()
         content["aggregation_method"] = "matching_deposit_group_id"
         return content
     def is_compatible_return_type(self, return_type):
         return return_type == "entry"
@@ -640,7 +640,7 @@ class IdentityGrouping(Grouping):
         content["aggregation_method"] = "sequence_identity"
         content["similarity_cutoff"] = self._similarity_cutoff
         return content
     def is_compatible_return_type(self, return_type):
         return return_type == "polymer_entity"
@@ -672,7 +672,7 @@ class UniprotGrouping(Grouping):
         content = super().get_content()
         content["aggregation_method"] = "matching_uniprot_accession"
         return content
     def is_compatible_return_type(self, return_type):
         return return_type == "polymer_entity"
@@ -685,9 +685,9 @@ def count(query, return_type="entry", group_by=None,
     """
     Count PDB entries that meet the given query requirements,
     via the RCSB search API.
     This function requires an internet connection.
     Parameters
     ----------
     query : Query
@@ -719,17 +719,17 @@ def count(query, return_type="entry", group_by=None,
     count : int
         The total number of PDB IDs (or groups) that would be returned
         by calling :func:`search()` using the same parameters.
     Notes
     -----
     If `group_by` is set, the number of results may be lower than in an
     ungrouped query, as grouping is not applicable to all structures.
     For example a DNA structure has no associated *Uniprot* accession
     and hence is omitted by :class:`UniprotGrouping`.
     Examples
     --------
     >>> query = FieldQuery("reflns.d_resolution_high", less_or_equal=0.6)
     >>> print(count(query))
     9
@@ -742,9 +742,9 @@ def count(query, return_type="entry", group_by=None,
     )
     query_dict["request_options"]["return_counts"] = True
     r = requests.get(_search_url, params={"json": json.dumps(query_dict)})
     if r.status_code == 200:
         if group_by is None:
             return r.json()["total_count"]
@@ -766,9 +766,9 @@ def search(query, return_type="entry", range=None, sort_by=None, group_by=None,
     """
     Get all PDB IDs that meet the given query requirements,
     via the RCSB search API.
     This function requires an internet connection.
     Parameters
     ----------
     query : Query
@@ -786,7 +786,7 @@ def search(query, return_type="entry", range=None, sort_by=None, group_by=None,
           of non-polymeric entities is returned (e.g. ``'XXXX_1'``).
         - ``'polymer_instance'``: The PDB ID appended with chain ID
           (more exactly ``'asym_id'``) is returned (e.g. ``'XXXX.A'``).
     range : tuple(int, int), optional
         If this parameter is specified, only PDB IDs in this range
         are selected from all matching PDB IDs and returned
@@ -832,7 +832,7 @@ def search(query, return_type="entry", range=None, sort_by=None, group_by=None,
         returned.
         This dictionary maps group identifiers to a list of all PDB IDs
         belonging to this group.
     Notes
     -----
     If `group_by` is set, the number of results may be lower than in an
@@ -846,7 +846,7 @@ def search(query, return_type="entry", range=None, sort_by=None, group_by=None,
     Examples
     --------
     >>> query = FieldQuery("reflns.d_resolution_high", less_or_equal=0.6)
     >>> print(sorted(search(query)))
     ['1EJG', '1I0T', '3NIR', '3P4J', '4JLJ', '5D8V', '5NW3', '7ATG', '7R0H']
@@ -894,7 +894,7 @@ def search(query, return_type="entry", range=None, sort_by=None, group_by=None,
         }
     r = requests.get(_search_url, params={"json": json.dumps(query_dict)})
     if r.status_code == 200:
         if group_by is None or not return_groups:
             return [result["identifier"] for result in r.json()["result_set"]]
@@ -926,9 +926,9 @@ def _initialize_query_dict(query, return_type, group_by, content_types):
         "polymer_entity", "non_polymer_entity",
     ]:
         raise ValueError(f"'{return_type}' is an invalid return type")
     request_options = {}
     if len(content_types) == 0:
         raise ValueError("At least one content type must be specified")
     for content_type in content_types:

biotite/sequence/align/__init__.py CHANGED Viewed

@@ -26,7 +26,7 @@ The aligning functions are usually C-accelerated, reducing the
 computation time substantially.
 This subpackage also contains functionality for finding *k-mer* matches
-between two sequences, allowing fast heuristic pairwise alignments.
+between two sequences, allowing fast heuristic pairwise alignments.
 """
 __name__ = "biotite.sequence.align"
@@ -34,6 +34,8 @@ __author__ = "Patrick Kunzmann"
 from .alignment import *
 from .banded import *
+from .buckets import *
+from .cigar import *
 from .kmeralphabet import *
 from .kmertable import *
 from .kmersimilarity import *
@@ -42,4 +44,6 @@ from .localungapped import *
 from .matrix import *
 from .multiple import *
 from .pairwise import *
+from .permutation import *
+from .selector import *
 from .statistics import *