rcsb.exdb 1.25__tar.gz → 1.26__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/HISTORY.txt +2 -0
- {rcsb_exdb-1.25/rcsb.exdb.egg-info → rcsb_exdb-1.26}/PKG-INFO +2 -2
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/cli/__init__.py +1 -1
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/seq/PolymerEntityExtractor.py +7 -1
- {rcsb_exdb-1.25 → rcsb_exdb-1.26/rcsb.exdb.egg-info}/PKG-INFO +2 -2
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb.exdb.egg-info/requires.txt +1 -1
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/requirements.txt +1 -1
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/LICENSE +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/MANIFEST.in +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/README.md +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/__init__.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/__init__.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/branch/BranchedEntityExtractor.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/branch/GlycanProvider.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/branch/GlycanUtils.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/branch/__init__.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/chemref/ChemRefEtlWorker.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/chemref/ChemRefExtractor.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/chemref/ChemRefMappingProvider.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/chemref/PubChemDataCacheProvider.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/chemref/PubChemEtlWrapper.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/chemref/PubChemIndexCacheProvider.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/chemref/__init__.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/citation/CitationAdapter.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/citation/CitationExtractor.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/citation/CitationUtils.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/citation/__init__.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/cli/ExDbExec.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/entry/EntryInfoProvider.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/entry/__init__.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/seq/AnnotationExtractor.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/seq/LigandNeighborMappingExtractor.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/seq/LigandNeighborMappingProvider.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/seq/ReferenceSequenceAnnotationAdapter.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/seq/ReferenceSequenceAnnotationProvider.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/seq/ReferenceSequenceAssignmentAdapter.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/seq/ReferenceSequenceAssignmentProvider.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/seq/ReferenceSequenceCacheProvider.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/seq/TaxonomyExtractor.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/seq/UniProtCoreEtlWorker.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/seq/UniProtExtractor.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/seq/__init__.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/__init__.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/fixtureDictMethodResourceProvider.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/fixturePdbxLoader.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testAnnotationExtractor.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testBranchedEntityExtractor.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testChemRefLoader.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testChemRefMappingProvider.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testCitationAdapter.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testCitationExtractor.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testCitationUtils.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testEntryInfoEtlWorkflow.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testEntryInfoProvider.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testExDbWorkflow.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testGlycanEtlWorkflow.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testGlycanProvider.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testGlycanUtils.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testLigandNeighborMappingProvider.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testObjectExtractor.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testObjectTransformer.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testObjectUpdater.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testPolymerEntityExtractor.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testPubChemDataCacheProvider.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testPubChemEtlWorkflow.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testPubChemEtlWrapper.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testPubChemIndexCacheProvider.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testReferenceSequenceAnnotationAdapter.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testReferenceSequenceAssignmentAdapter.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testReferenceSequenceAssignmentAdapterValidate.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testReferenceSequenceAssignmentProvider.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testReferenceSequenceCacheProvider.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testTaxonomyExtractor.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testTreeNodeListWorker.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testUniProtCoreEtlWorker.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testUniProtExtractor.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tree/TreeNodeListWorker.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tree/__init__.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/utils/ObjectAdapterBase.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/utils/ObjectExtractor.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/utils/ObjectTransformer.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/utils/ObjectUpdater.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/utils/ObjectValidator.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/utils/__init__.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/wf/EntryInfoEtlWorkflow.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/wf/ExDbWorkflow.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/wf/GlycanEtlWorkflow.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/wf/PubChemEtlWorkflow.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/wf/__init__.py +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb.exdb.egg-info/SOURCES.txt +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb.exdb.egg-info/dependency_links.txt +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb.exdb.egg-info/entry_points.txt +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb.exdb.egg-info/not-zip-safe +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb.exdb.egg-info/top_level.txt +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/setup.cfg +0 -0
- {rcsb_exdb-1.25 → rcsb_exdb-1.26}/setup.py +0 -0
|
@@ -106,3 +106,5 @@
|
|
|
106
106
|
27-Aug-2024 V1.24 Update tree loading for CARD ontology data
|
|
107
107
|
22-Oct-2024 V1.25 Add CLI for CCD image and file generation;
|
|
108
108
|
Update CI/CD to python 3.10
|
|
109
|
+
10-Dec-2024 V1.26 Update PolymerEntityExtractor to sort extracted sequence data;
|
|
110
|
+
Update Azure pipelines to run on latest macOS and ubuntu version
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.1
|
|
2
2
|
Name: rcsb.exdb
|
|
3
|
-
Version: 1.25
|
|
3
|
+
Version: 1.26
|
|
4
4
|
Summary: RCSB Python ExDB data extraction and loading workflows
|
|
5
5
|
Home-page: https://github.com/rcsb/py-rcsb_exdb
|
|
6
6
|
Author: John Westbrook
|
|
@@ -28,7 +28,7 @@ Requires-Dist: rcsb.utils.config>=0.40
|
|
|
28
28
|
Requires-Dist: rcsb.utils.ec>=0.25
|
|
29
29
|
Requires-Dist: rcsb.utils.go>=0.18
|
|
30
30
|
Requires-Dist: rcsb.utils.seq>=0.82
|
|
31
|
-
Requires-Dist: rcsb.utils.seqalign>=0.
|
|
31
|
+
Requires-Dist: rcsb.utils.seqalign>=0.31
|
|
32
32
|
Requires-Dist: rcsb.utils.targets>=0.82
|
|
33
33
|
Requires-Dist: rcsb.utils.struct>=0.47
|
|
34
34
|
Requires-Dist: rcsb.utils.taxonomy>=0.43
|
|
@@ -7,6 +7,8 @@
|
|
|
7
7
|
#
|
|
8
8
|
# Updates:
|
|
9
9
|
# 9-Jan-2024 dwp Turn off use of uniprot_exdb DB for enriching protein entity details file (data not used)
|
|
10
|
+
# 10-Dec-2024 dwp Sort extracted polymer entity sequence data by entity ID (alphabetically), to ensure consistent
|
|
11
|
+
# ordering between coasts (order of sequence data influences results of mmseqs2 sequence searching)
|
|
10
12
|
#
|
|
11
13
|
##
|
|
12
14
|
__docformat__ = "google en"
|
|
@@ -16,6 +18,7 @@ __license__ = "Apache 2.0"
|
|
|
16
18
|
|
|
17
19
|
import logging
|
|
18
20
|
import os
|
|
21
|
+
from collections import OrderedDict
|
|
19
22
|
|
|
20
23
|
from rcsb.exdb.utils.ObjectExtractor import ObjectExtractor
|
|
21
24
|
from rcsb.utils.io.MarshalUtil import MarshalUtil
|
|
@@ -175,9 +178,12 @@ class PolymerEntityExtractor(object):
|
|
|
175
178
|
pass
|
|
176
179
|
rD[rId] = {"alignmentL": uDL, "sourceOrgL": sL, "partCount": partCount, "taxCount": taxCount, "sequence": seqS, "seqLen": seqLen}
|
|
177
180
|
|
|
181
|
+
# Sort the dict in alphabetical order (by entity ID key) to ensure consistent/reproducible treatment by mmseqs2
|
|
182
|
+
sortedD = OrderedDict((k, rD.pop(k)) for k in sorted(rD))
|
|
183
|
+
|
|
178
184
|
except Exception as e:
|
|
179
185
|
logger.exception("Failing with %s", str(e))
|
|
180
|
-
return rD, missingSrcD
|
|
186
|
+
return sortedD, missingSrcD
|
|
181
187
|
|
|
182
188
|
def __getSourcePart(self, entityId, sourceOrgL, entityBeg, seqLen):
|
|
183
189
|
"""Return the source part containing the input entity range -
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.1
|
|
2
2
|
Name: rcsb.exdb
|
|
3
|
-
Version: 1.25
|
|
3
|
+
Version: 1.26
|
|
4
4
|
Summary: RCSB Python ExDB data extraction and loading workflows
|
|
5
5
|
Home-page: https://github.com/rcsb/py-rcsb_exdb
|
|
6
6
|
Author: John Westbrook
|
|
@@ -28,7 +28,7 @@ Requires-Dist: rcsb.utils.config>=0.40
|
|
|
28
28
|
Requires-Dist: rcsb.utils.ec>=0.25
|
|
29
29
|
Requires-Dist: rcsb.utils.go>=0.18
|
|
30
30
|
Requires-Dist: rcsb.utils.seq>=0.82
|
|
31
|
-
Requires-Dist: rcsb.utils.seqalign>=0.
|
|
31
|
+
Requires-Dist: rcsb.utils.seqalign>=0.31
|
|
32
32
|
Requires-Dist: rcsb.utils.targets>=0.82
|
|
33
33
|
Requires-Dist: rcsb.utils.struct>=0.47
|
|
34
34
|
Requires-Dist: rcsb.utils.taxonomy>=0.43
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testReferenceSequenceAssignmentAdapterValidate.py
RENAMED
|
File without changes
|
{rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testReferenceSequenceAssignmentProvider.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|