rcsb.exdb 1.1__tar.gz → 1.21__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/HISTORY.txt +2 -0
- {rcsb_exdb-1.1/rcsb.exdb.egg-info → rcsb_exdb-1.21}/PKG-INFO +13 -13
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/chemref/ChemRefEtlWorker.py +5 -4
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/chemref/PubChemIndexCacheProvider.py +2 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/cli/ExDbExec.py +2 -2
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/cli/__init__.py +1 -1
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/seq/UniProtCoreEtlWorker.py +1 -1
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/fixturePdbxLoader.py +2 -2
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testExDbWorkflow.py +2 -2
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testReferenceSequenceAnnotationAdapter.py +3 -2
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testReferenceSequenceCacheProvider.py +2 -2
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/utils/ObjectTransformer.py +1 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/utils/ObjectValidator.py +1 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/wf/ExDbWorkflow.py +4 -4
- {rcsb_exdb-1.1 → rcsb_exdb-1.21/rcsb.exdb.egg-info}/PKG-INFO +13 -13
- rcsb_exdb-1.21/rcsb.exdb.egg-info/requires.txt +25 -0
- rcsb_exdb-1.21/requirements.txt +18 -0
- rcsb_exdb-1.1/rcsb.exdb.egg-info/requires.txt +0 -25
- rcsb_exdb-1.1/requirements.txt +0 -18
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/LICENSE +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/MANIFEST.in +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/README.md +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/__init__.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/__init__.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/branch/BranchedEntityExtractor.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/branch/GlycanProvider.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/branch/GlycanUtils.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/branch/__init__.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/chemref/ChemRefExtractor.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/chemref/ChemRefMappingProvider.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/chemref/PubChemDataCacheProvider.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/chemref/PubChemEtlWrapper.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/chemref/__init__.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/citation/CitationAdapter.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/citation/CitationExtractor.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/citation/CitationUtils.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/citation/__init__.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/entry/EntryInfoProvider.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/entry/__init__.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/seq/AnnotationExtractor.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/seq/LigandNeighborMappingExtractor.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/seq/LigandNeighborMappingProvider.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/seq/PolymerEntityExtractor.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/seq/ReferenceSequenceAnnotationAdapter.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/seq/ReferenceSequenceAnnotationProvider.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/seq/ReferenceSequenceAssignmentAdapter.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/seq/ReferenceSequenceAssignmentProvider.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/seq/ReferenceSequenceCacheProvider.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/seq/TaxonomyExtractor.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/seq/UniProtExtractor.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/seq/__init__.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/__init__.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/fixtureDictMethodResourceProvider.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testAnnotationExtractor.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testBranchedEntityExtractor.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testChemRefLoader.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testChemRefMappingProvider.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testCitationAdapter.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testCitationExtractor.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testCitationUtils.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testEntryInfoEtlWorkflow.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testEntryInfoProvider.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testGlycanEtlWorkflow.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testGlycanProvider.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testGlycanUtils.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testLigandNeighborMappingProvider.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testObjectExtractor.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testObjectTransformer.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testObjectUpdater.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testPolymerEntityExtractor.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testPubChemDataCacheProvider.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testPubChemEtlWorkflow.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testPubChemEtlWrapper.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testPubChemIndexCacheProvider.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testReferenceSequenceAssignmentAdapter.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testReferenceSequenceAssignmentAdapterValidate.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testReferenceSequenceAssignmentProvider.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testTaxonomyExtractor.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testTreeNodeListWorker.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testUniProtCoreEtlWorker.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testUniProtExtractor.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tree/TreeNodeListWorker.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tree/__init__.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/utils/ObjectAdapterBase.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/utils/ObjectExtractor.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/utils/ObjectUpdater.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/utils/__init__.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/wf/EntryInfoEtlWorkflow.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/wf/GlycanEtlWorkflow.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/wf/PubChemEtlWorkflow.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/wf/__init__.py +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb.exdb.egg-info/SOURCES.txt +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb.exdb.egg-info/dependency_links.txt +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb.exdb.egg-info/entry_points.txt +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb.exdb.egg-info/not-zip-safe +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb.exdb.egg-info/top_level.txt +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/setup.cfg +0 -0
- {rcsb_exdb-1.1 → rcsb_exdb-1.21}/setup.py +0 -0
|
@@ -99,3 +99,5 @@
|
|
|
99
99
|
This package update also coincides with the turning off of uniprot_exdb data loading during the weekly workflow
|
|
100
100
|
6-May-2024 V1.1 Update ExDbExec CLI and ExDbWorkflow to support CLI usage from weekly-update workflow;
|
|
101
101
|
Update unit tests and setuptools config
|
|
102
|
+
9-May-2024 V1.2 Adjust provider type exclusion input to accept a list of types
|
|
103
|
+
13-May-2024 V1.21 Update requirements; fix linting
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.1
|
|
2
2
|
Name: rcsb.exdb
|
|
3
|
-
Version: 1.1
|
|
3
|
+
Version: 1.21
|
|
4
4
|
Summary: RCSB Python ExDB data extraction and loading workflows
|
|
5
5
|
Home-page: https://github.com/rcsb/py-rcsb_exdb
|
|
6
6
|
Author: John Westbrook
|
|
@@ -18,18 +18,18 @@ License-File: LICENSE
|
|
|
18
18
|
Requires-Dist: OpenEye-toolkits>=2020.2.2
|
|
19
19
|
Requires-Dist: numpy
|
|
20
20
|
Requires-Dist: jsonschema>=2.6.0
|
|
21
|
-
Requires-Dist: rcsb.utils.io>=1.28
|
|
22
|
-
Requires-Dist: rcsb.db>=1.691
|
|
23
|
-
Requires-Dist: rcsb.utils.chemref>=0.79
|
|
24
|
-
Requires-Dist: rcsb.utils.chem>=0.75
|
|
25
|
-
Requires-Dist: rcsb.utils.citation>=0.16
|
|
26
|
-
Requires-Dist: rcsb.utils.config>=0.35
|
|
27
|
-
Requires-Dist: rcsb.utils.ec>=0.22
|
|
28
|
-
Requires-Dist: rcsb.utils.go>=0.17
|
|
29
|
-
Requires-Dist: rcsb.utils.seq>=0.63
|
|
30
|
-
Requires-Dist: rcsb.utils.struct>=0.37
|
|
31
|
-
Requires-Dist: rcsb.utils.taxonomy>=0.39
|
|
32
|
-
Requires-Dist: rcsb.utils.dictionary>=0.71
|
|
21
|
+
Requires-Dist: rcsb.utils.io>=1.46
|
|
22
|
+
Requires-Dist: rcsb.db>=1.721
|
|
23
|
+
Requires-Dist: rcsb.utils.chem>=0.79
|
|
24
|
+
Requires-Dist: rcsb.utils.chemref>=0.91
|
|
25
|
+
Requires-Dist: rcsb.utils.citation>=0.22
|
|
26
|
+
Requires-Dist: rcsb.utils.config>=0.40
|
|
27
|
+
Requires-Dist: rcsb.utils.ec>=0.25
|
|
28
|
+
Requires-Dist: rcsb.utils.go>=0.18
|
|
29
|
+
Requires-Dist: rcsb.utils.seq>=0.79
|
|
30
|
+
Requires-Dist: rcsb.utils.struct>=0.47
|
|
31
|
+
Requires-Dist: rcsb.utils.taxonomy>=0.43
|
|
32
|
+
Requires-Dist: rcsb.utils.dictionary>=1.24
|
|
33
33
|
Requires-Dist: rcsb.workflow>=0.42
|
|
34
34
|
Requires-Dist: statistics; python_version < "3.0"
|
|
35
35
|
Provides-Extra: dev
|
|
@@ -65,6 +65,7 @@ class ChemRefEtlWorker(object):
|
|
|
65
65
|
self.__statusList = []
|
|
66
66
|
desp = DataExchangeStatus()
|
|
67
67
|
statusStartTimestamp = desp.setStartTime()
|
|
68
|
+
addValues = {}
|
|
68
69
|
#
|
|
69
70
|
if extResource == "DrugBank":
|
|
70
71
|
databaseName = "drugbank_core"
|
|
@@ -85,10 +86,10 @@ class ChemRefEtlWorker(object):
|
|
|
85
86
|
indexL = sD.getDocumentIndex(collectionName, "primary")
|
|
86
87
|
logger.info("Database %r collection %r index attributes %r", databaseName, collectionName, indexL)
|
|
87
88
|
#
|
|
88
|
-
|
|
89
|
-
|
|
90
|
-
#
|
|
91
|
-
addValues = {}
|
|
89
|
+
# For some reason, 'addValues' was being overwritten with an empty dict (https://github.com/rcsb/py-rcsb_exdb/commit/26bd79e9a2fffc97c034b4116dece9248d1c1f39)
|
|
90
|
+
# Will need to review this -- do we want to add the schema version values or not? (Also, see similar logic in UniProtCoreEtlWorker.py)
|
|
91
|
+
# collectionVersion = sD.getCollectionVersion(collectionName)
|
|
92
|
+
# addValues = {"_schema_version": collectionVersion}
|
|
92
93
|
#
|
|
93
94
|
dl = DocumentLoader(
|
|
94
95
|
self.__cfgOb,
|
|
@@ -64,6 +64,8 @@ class PubChemUpdateWorker(object):
|
|
|
64
64
|
(list): list of ChemicalIdentifier() objects corresponding to the input chemical component.
|
|
65
65
|
"""
|
|
66
66
|
chemIdList = []
|
|
67
|
+
idType = None
|
|
68
|
+
descr = None
|
|
67
69
|
if ccId in self.__lookupD:
|
|
68
70
|
for sD in self.__lookupD[ccId]:
|
|
69
71
|
if "inchi-key" in sD:
|
|
@@ -71,7 +71,7 @@ def main():
|
|
|
71
71
|
#
|
|
72
72
|
parser.add_argument("--rebuild_cache", default=False, action="store_true", help="Rebuild cached resource files")
|
|
73
73
|
parser.add_argument("--rebuild_sequence_cache", default=False, action="store_true", help="Rebuild cached resource files for reference sequence updates")
|
|
74
|
-
parser.add_argument("--
|
|
74
|
+
parser.add_argument("--provider_types_exclude", default=None, help="Resource provider types to exclude")
|
|
75
75
|
parser.add_argument("--use_filtered_tax_list", default=False, action="store_true", help="Use filtered list for taxonomy tree loading")
|
|
76
76
|
parser.add_argument("--disable_read_back_check", default=False, action="store_true", help="Disable read back check on all documents")
|
|
77
77
|
parser.add_argument("--debug", default=False, action="store_true", help="Turn on verbose logging")
|
|
@@ -178,7 +178,7 @@ def processArguments(args):
|
|
|
178
178
|
"mockTopPath": mockTopPath,
|
|
179
179
|
"debugFlag": debugFlag,
|
|
180
180
|
"rebuildCache": args.rebuild_cache,
|
|
181
|
-
"
|
|
181
|
+
"providerTypeExcludeL": args.provider_types_exclude,
|
|
182
182
|
}
|
|
183
183
|
loadD = {
|
|
184
184
|
"loadType": args.load_type,
|
|
@@ -95,6 +95,7 @@ class UniProtCoreEtlWorker(object):
|
|
|
95
95
|
#
|
|
96
96
|
dList = indexL = []
|
|
97
97
|
databaseName = collectionName = collectionVersion = None
|
|
98
|
+
addValues = {}
|
|
98
99
|
#
|
|
99
100
|
if extResource == "UniProt":
|
|
100
101
|
databaseName = "uniprot_core"
|
|
@@ -114,7 +115,6 @@ class UniProtCoreEtlWorker(object):
|
|
|
114
115
|
collectionVersion = cDL[0]["VERSION"]
|
|
115
116
|
indexL = self.__docHelper.getDocumentIndexAttributes(collectionName, "primary")
|
|
116
117
|
logger.info("Database %r collection %r version %r index attributes %r", databaseName, collectionName, collectionVersion, indexL)
|
|
117
|
-
addValues = {}
|
|
118
118
|
else:
|
|
119
119
|
logger.error("Unsupported external resource %r", extResource)
|
|
120
120
|
#
|
|
@@ -48,7 +48,7 @@ class PdbxLoaderFixture(unittest.TestCase):
|
|
|
48
48
|
#
|
|
49
49
|
#
|
|
50
50
|
self.__isMac = platform.system() == "Darwin"
|
|
51
|
-
self.
|
|
51
|
+
self.__excludeTypeL = None if self.__isMac else ["optional"]
|
|
52
52
|
self.__mockTopPath = os.path.join(TOPDIR, "rcsb", "mock-data")
|
|
53
53
|
configPath = os.path.join(TOPDIR, "rcsb", "mock-data", "config", "dbload-setup-example.yml")
|
|
54
54
|
# configPath = os.path.join(TOPDIR, "rcsb", "mock-data", "config", "dbload-setup-example-local.yml")
|
|
@@ -249,7 +249,7 @@ class PdbxLoaderFixture(unittest.TestCase):
|
|
|
249
249
|
validationLevel=kwargs["validationLevel"],
|
|
250
250
|
mergeContentTypes=kwargs["mergeContentTypes"],
|
|
251
251
|
useNameFlag=False,
|
|
252
|
-
|
|
252
|
+
providerTypeExcludeL=self.__excludeTypeL,
|
|
253
253
|
restoreUseGit=True,
|
|
254
254
|
restoreUseStash=False,
|
|
255
255
|
)
|
|
@@ -42,7 +42,7 @@ class ExDbWorkflowTests(unittest.TestCase):
|
|
|
42
42
|
|
|
43
43
|
def setUp(self):
|
|
44
44
|
self.__isMac = platform.system() == "Darwin"
|
|
45
|
-
self.
|
|
45
|
+
self.__excludeTypeL = None if self.__isMac else ["optional"]
|
|
46
46
|
mockTopPath = os.path.join(TOPDIR, "rcsb", "mock-data")
|
|
47
47
|
configPath = os.path.join(mockTopPath, "config", "dbload-setup-example.yml")
|
|
48
48
|
configName = "site_info_configuration"
|
|
@@ -55,7 +55,7 @@ class ExDbWorkflowTests(unittest.TestCase):
|
|
|
55
55
|
"configName": configName,
|
|
56
56
|
"cachePath": cachePath,
|
|
57
57
|
"rebuildCache": False,
|
|
58
|
-
"
|
|
58
|
+
"providerTypeExcludeL": self.__excludeTypeL,
|
|
59
59
|
"restoreUseGit": True,
|
|
60
60
|
"restoreUseStash": False,
|
|
61
61
|
}
|
|
@@ -60,6 +60,7 @@ class ReferenceSequenceAnnotationAdapterTests(unittest.TestCase):
|
|
|
60
60
|
endTime = time.time()
|
|
61
61
|
logger.info("Completed %s at %s (%.4f seconds)", self.id(), time.strftime("%Y %m %d %H:%M:%S", time.localtime()), endTime - self.__startTime)
|
|
62
62
|
|
|
63
|
+
# @unittest.skip("Disable test - no longer using in production, and fails too frequently with 'Bad xml text' when fetching from UniProt")
|
|
63
64
|
def testAnnotationAdapter(self):
|
|
64
65
|
"""Test case - create and read cache reference sequences assignments and related data."""
|
|
65
66
|
try:
|
|
@@ -70,13 +71,13 @@ class ReferenceSequenceAnnotationAdapterTests(unittest.TestCase):
|
|
|
70
71
|
rsaP = ReferenceSequenceAnnotationProvider(
|
|
71
72
|
self.__cfgOb, databaseName, collectionName, polymerType, fetchLimit=self.__fetchLimit, siftsAbbreviated="TEST", cachePath=self.__cachePath, useCache=True
|
|
72
73
|
)
|
|
73
|
-
ok = rsaP.testCache()
|
|
74
|
+
ok = rsaP.testCache(minMissing=10)
|
|
74
75
|
self.assertTrue(ok)
|
|
75
76
|
numRef1 = rsaP.getRefDataCount()
|
|
76
77
|
#
|
|
77
78
|
# --- Reload from cache ---
|
|
78
79
|
rsaP = ReferenceSequenceAnnotationProvider(self.__cfgOb, databaseName, collectionName, polymerType, cachePath=self.__cachePath, useCache=True)
|
|
79
|
-
ok = rsaP.testCache()
|
|
80
|
+
ok = rsaP.testCache(minMissing=10)
|
|
80
81
|
self.assertTrue(ok)
|
|
81
82
|
numRef2 = rsaP.getRefDataCount()
|
|
82
83
|
self.assertEqual(numRef1, numRef2)
|
|
@@ -70,14 +70,14 @@ class ReferenceSequenceCacheProviderTests(unittest.TestCase):
|
|
|
70
70
|
ok = rsaP.testCache()
|
|
71
71
|
self.assertTrue(ok)
|
|
72
72
|
numRef = rsaP.getRefDataCount()
|
|
73
|
-
self.assertGreaterEqual(numRef,
|
|
73
|
+
self.assertGreaterEqual(numRef, 44)
|
|
74
74
|
#
|
|
75
75
|
# --- Reload from cache ---
|
|
76
76
|
rsaP = ReferenceSequenceCacheProvider(self.__cfgOb, databaseName, collectionName, polymerType, maxChunkSize=50, numProc=2, expireDays=14)
|
|
77
77
|
ok = rsaP.testCache()
|
|
78
78
|
self.assertTrue(ok)
|
|
79
79
|
numRef = rsaP.getRefDataCount()
|
|
80
|
-
self.assertGreaterEqual(numRef,
|
|
80
|
+
self.assertGreaterEqual(numRef, 44)
|
|
81
81
|
except Exception as e:
|
|
82
82
|
logger.exception("Failing with %s", str(e))
|
|
83
83
|
self.fail()
|
|
@@ -47,6 +47,7 @@ class ObjectTransformer(object):
|
|
|
47
47
|
docSelectList = docSelectList[:fetchLimit] if fetchLimit else docSelectList
|
|
48
48
|
ok = self.__transform(databaseName, collectionName, docSelectList)
|
|
49
49
|
#
|
|
50
|
+
okS = True
|
|
50
51
|
if updateId:
|
|
51
52
|
okS = self.__updateStatus(updateId, databaseName, collectionName, ok, statusStartTimestamp)
|
|
52
53
|
return ok and okS
|
|
@@ -54,7 +54,7 @@ class ExDbWorkflow(object):
|
|
|
54
54
|
# Rebuild cache (default False)
|
|
55
55
|
rebuildCache = kwargs.get("rebuildCache", False)
|
|
56
56
|
self.__useCache = not rebuildCache
|
|
57
|
-
|
|
57
|
+
providerTypeExcludeL = kwargs.get("providerTypeExcludeL", None)
|
|
58
58
|
restoreUseGit = kwargs.get("restoreUseGit", True)
|
|
59
59
|
restoreUseStash = kwargs.get("restoreUseStash", True)
|
|
60
60
|
self.__cacheStatus = True
|
|
@@ -62,7 +62,7 @@ class ExDbWorkflow(object):
|
|
|
62
62
|
logger.info("Rebuilding cache %r", rebuildCache)
|
|
63
63
|
self.__cacheStatus = self.buildResourceCache(
|
|
64
64
|
rebuildCache=rebuildCache,
|
|
65
|
-
|
|
65
|
+
providerTypeExcludeL=providerTypeExcludeL,
|
|
66
66
|
restoreUseStash=restoreUseStash,
|
|
67
67
|
restoreUseGit=restoreUseGit,
|
|
68
68
|
)
|
|
@@ -204,7 +204,7 @@ class ExDbWorkflow(object):
|
|
|
204
204
|
logger.exception("Failing with %s", str(e))
|
|
205
205
|
return ret
|
|
206
206
|
|
|
207
|
-
def buildResourceCache(self, rebuildCache=False,
|
|
207
|
+
def buildResourceCache(self, rebuildCache=False, providerTypeExcludeL=None, restoreUseStash=True, restoreUseGit=True):
|
|
208
208
|
"""Generate and cache resource dependencies."""
|
|
209
209
|
ret = False
|
|
210
210
|
try:
|
|
@@ -223,7 +223,7 @@ class ExDbWorkflow(object):
|
|
|
223
223
|
cachePath=self.__cachePath,
|
|
224
224
|
restoreUseStash=restoreUseStash,
|
|
225
225
|
restoreUseGit=restoreUseGit,
|
|
226
|
-
|
|
226
|
+
providerTypeExcludeL=providerTypeExcludeL,
|
|
227
227
|
)
|
|
228
228
|
ret = rP.cacheResources(useCache=useCache, doBackup=False)
|
|
229
229
|
logger.info("useCache %r cache reload status (%r)", useCache, ret)
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.1
|
|
2
2
|
Name: rcsb.exdb
|
|
3
|
-
Version: 1.1
|
|
3
|
+
Version: 1.21
|
|
4
4
|
Summary: RCSB Python ExDB data extraction and loading workflows
|
|
5
5
|
Home-page: https://github.com/rcsb/py-rcsb_exdb
|
|
6
6
|
Author: John Westbrook
|
|
@@ -18,18 +18,18 @@ License-File: LICENSE
|
|
|
18
18
|
Requires-Dist: OpenEye-toolkits>=2020.2.2
|
|
19
19
|
Requires-Dist: numpy
|
|
20
20
|
Requires-Dist: jsonschema>=2.6.0
|
|
21
|
-
Requires-Dist: rcsb.utils.io>=1.28
|
|
22
|
-
Requires-Dist: rcsb.db>=1.691
|
|
23
|
-
Requires-Dist: rcsb.utils.chemref>=0.79
|
|
24
|
-
Requires-Dist: rcsb.utils.chem>=0.75
|
|
25
|
-
Requires-Dist: rcsb.utils.citation>=0.16
|
|
26
|
-
Requires-Dist: rcsb.utils.config>=0.35
|
|
27
|
-
Requires-Dist: rcsb.utils.ec>=0.22
|
|
28
|
-
Requires-Dist: rcsb.utils.go>=0.17
|
|
29
|
-
Requires-Dist: rcsb.utils.seq>=0.63
|
|
30
|
-
Requires-Dist: rcsb.utils.struct>=0.37
|
|
31
|
-
Requires-Dist: rcsb.utils.taxonomy>=0.39
|
|
32
|
-
Requires-Dist: rcsb.utils.dictionary>=0.71
|
|
21
|
+
Requires-Dist: rcsb.utils.io>=1.46
|
|
22
|
+
Requires-Dist: rcsb.db>=1.721
|
|
23
|
+
Requires-Dist: rcsb.utils.chem>=0.79
|
|
24
|
+
Requires-Dist: rcsb.utils.chemref>=0.91
|
|
25
|
+
Requires-Dist: rcsb.utils.citation>=0.22
|
|
26
|
+
Requires-Dist: rcsb.utils.config>=0.40
|
|
27
|
+
Requires-Dist: rcsb.utils.ec>=0.25
|
|
28
|
+
Requires-Dist: rcsb.utils.go>=0.18
|
|
29
|
+
Requires-Dist: rcsb.utils.seq>=0.79
|
|
30
|
+
Requires-Dist: rcsb.utils.struct>=0.47
|
|
31
|
+
Requires-Dist: rcsb.utils.taxonomy>=0.43
|
|
32
|
+
Requires-Dist: rcsb.utils.dictionary>=1.24
|
|
33
33
|
Requires-Dist: rcsb.workflow>=0.42
|
|
34
34
|
Requires-Dist: statistics; python_version < "3.0"
|
|
35
35
|
Provides-Extra: dev
|
|
@@ -0,0 +1,25 @@
|
|
|
1
|
+
OpenEye-toolkits>=2020.2.2
|
|
2
|
+
numpy
|
|
3
|
+
jsonschema>=2.6.0
|
|
4
|
+
rcsb.utils.io>=1.46
|
|
5
|
+
rcsb.db>=1.721
|
|
6
|
+
rcsb.utils.chem>=0.79
|
|
7
|
+
rcsb.utils.chemref>=0.91
|
|
8
|
+
rcsb.utils.citation>=0.22
|
|
9
|
+
rcsb.utils.config>=0.40
|
|
10
|
+
rcsb.utils.ec>=0.25
|
|
11
|
+
rcsb.utils.go>=0.18
|
|
12
|
+
rcsb.utils.seq>=0.79
|
|
13
|
+
rcsb.utils.struct>=0.47
|
|
14
|
+
rcsb.utils.taxonomy>=0.43
|
|
15
|
+
rcsb.utils.dictionary>=1.24
|
|
16
|
+
rcsb.workflow>=0.42
|
|
17
|
+
|
|
18
|
+
[:python_version < "3.0"]
|
|
19
|
+
statistics
|
|
20
|
+
|
|
21
|
+
[dev]
|
|
22
|
+
check-manifest
|
|
23
|
+
|
|
24
|
+
[test]
|
|
25
|
+
coverage
|
|
@@ -0,0 +1,18 @@
|
|
|
1
|
+
--extra-index-url https://pypi.anaconda.org/OpenEye/simple
|
|
2
|
+
OpenEye-toolkits >= 2020.2.2
|
|
3
|
+
numpy
|
|
4
|
+
jsonschema >= 2.6.0
|
|
5
|
+
rcsb.utils.io >= 1.46
|
|
6
|
+
rcsb.db >= 1.721
|
|
7
|
+
rcsb.utils.chem >= 0.79
|
|
8
|
+
rcsb.utils.chemref >= 0.91
|
|
9
|
+
rcsb.utils.citation >= 0.22
|
|
10
|
+
rcsb.utils.config >= 0.40
|
|
11
|
+
rcsb.utils.ec >= 0.25
|
|
12
|
+
rcsb.utils.go >= 0.18
|
|
13
|
+
rcsb.utils.seq >= 0.79
|
|
14
|
+
rcsb.utils.struct >= 0.47
|
|
15
|
+
rcsb.utils.taxonomy >= 0.43
|
|
16
|
+
rcsb.utils.dictionary >= 1.24
|
|
17
|
+
rcsb.workflow >= 0.42
|
|
18
|
+
statistics; python_version < "3.0"
|
|
@@ -1,25 +0,0 @@
|
|
|
1
|
-
OpenEye-toolkits>=2020.2.2
|
|
2
|
-
numpy
|
|
3
|
-
jsonschema>=2.6.0
|
|
4
|
-
rcsb.utils.io>=1.28
|
|
5
|
-
rcsb.db>=1.691
|
|
6
|
-
rcsb.utils.chemref>=0.79
|
|
7
|
-
rcsb.utils.chem>=0.75
|
|
8
|
-
rcsb.utils.citation>=0.16
|
|
9
|
-
rcsb.utils.config>=0.35
|
|
10
|
-
rcsb.utils.ec>=0.22
|
|
11
|
-
rcsb.utils.go>=0.17
|
|
12
|
-
rcsb.utils.seq>=0.63
|
|
13
|
-
rcsb.utils.struct>=0.37
|
|
14
|
-
rcsb.utils.taxonomy>=0.39
|
|
15
|
-
rcsb.utils.dictionary>=0.71
|
|
16
|
-
rcsb.workflow>=0.42
|
|
17
|
-
|
|
18
|
-
[:python_version < "3.0"]
|
|
19
|
-
statistics
|
|
20
|
-
|
|
21
|
-
[dev]
|
|
22
|
-
check-manifest
|
|
23
|
-
|
|
24
|
-
[test]
|
|
25
|
-
coverage
|
rcsb_exdb-1.1/requirements.txt
DELETED
|
@@ -1,18 +0,0 @@
|
|
|
1
|
-
--extra-index-url https://pypi.anaconda.org/OpenEye/simple
|
|
2
|
-
OpenEye-toolkits >= 2020.2.2
|
|
3
|
-
numpy
|
|
4
|
-
jsonschema >= 2.6.0
|
|
5
|
-
rcsb.utils.io >= 1.28
|
|
6
|
-
rcsb.db >= 1.691
|
|
7
|
-
rcsb.utils.chemref >= 0.79
|
|
8
|
-
rcsb.utils.chem >= 0.75
|
|
9
|
-
rcsb.utils.citation >= 0.16
|
|
10
|
-
rcsb.utils.config >= 0.35
|
|
11
|
-
rcsb.utils.ec >= 0.22
|
|
12
|
-
rcsb.utils.go >= 0.17
|
|
13
|
-
rcsb.utils.seq >= 0.63
|
|
14
|
-
rcsb.utils.struct >= 0.37
|
|
15
|
-
rcsb.utils.taxonomy >= 0.39
|
|
16
|
-
rcsb.utils.dictionary >= 0.71
|
|
17
|
-
rcsb.workflow >= 0.42
|
|
18
|
-
statistics; python_version < "3.0"
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{rcsb_exdb-1.1 → rcsb_exdb-1.21}/rcsb/exdb/tests/testReferenceSequenceAssignmentAdapterValidate.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|