rcsb.exdb 1.25__tar.gz → 1.26__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (96)
  1. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/HISTORY.txt +2 -0
  2. {rcsb_exdb-1.25/rcsb.exdb.egg-info → rcsb_exdb-1.26}/PKG-INFO +2 -2
  3. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/cli/__init__.py +1 -1
  4. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/seq/PolymerEntityExtractor.py +7 -1
  5. {rcsb_exdb-1.25 → rcsb_exdb-1.26/rcsb.exdb.egg-info}/PKG-INFO +2 -2
  6. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb.exdb.egg-info/requires.txt +1 -1
  7. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/requirements.txt +1 -1
  8. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/LICENSE +0 -0
  9. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/MANIFEST.in +0 -0
  10. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/README.md +0 -0
  11. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/__init__.py +0 -0
  12. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/__init__.py +0 -0
  13. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/branch/BranchedEntityExtractor.py +0 -0
  14. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/branch/GlycanProvider.py +0 -0
  15. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/branch/GlycanUtils.py +0 -0
  16. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/branch/__init__.py +0 -0
  17. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/chemref/ChemRefEtlWorker.py +0 -0
  18. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/chemref/ChemRefExtractor.py +0 -0
  19. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/chemref/ChemRefMappingProvider.py +0 -0
  20. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/chemref/PubChemDataCacheProvider.py +0 -0
  21. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/chemref/PubChemEtlWrapper.py +0 -0
  22. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/chemref/PubChemIndexCacheProvider.py +0 -0
  23. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/chemref/__init__.py +0 -0
  24. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/citation/CitationAdapter.py +0 -0
  25. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/citation/CitationExtractor.py +0 -0
  26. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/citation/CitationUtils.py +0 -0
  27. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/citation/__init__.py +0 -0
  28. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/cli/ExDbExec.py +0 -0
  29. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/entry/EntryInfoProvider.py +0 -0
  30. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/entry/__init__.py +0 -0
  31. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/seq/AnnotationExtractor.py +0 -0
  32. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/seq/LigandNeighborMappingExtractor.py +0 -0
  33. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/seq/LigandNeighborMappingProvider.py +0 -0
  34. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/seq/ReferenceSequenceAnnotationAdapter.py +0 -0
  35. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/seq/ReferenceSequenceAnnotationProvider.py +0 -0
  36. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/seq/ReferenceSequenceAssignmentAdapter.py +0 -0
  37. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/seq/ReferenceSequenceAssignmentProvider.py +0 -0
  38. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/seq/ReferenceSequenceCacheProvider.py +0 -0
  39. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/seq/TaxonomyExtractor.py +0 -0
  40. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/seq/UniProtCoreEtlWorker.py +0 -0
  41. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/seq/UniProtExtractor.py +0 -0
  42. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/seq/__init__.py +0 -0
  43. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/__init__.py +0 -0
  44. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/fixtureDictMethodResourceProvider.py +0 -0
  45. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/fixturePdbxLoader.py +0 -0
  46. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testAnnotationExtractor.py +0 -0
  47. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testBranchedEntityExtractor.py +0 -0
  48. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testChemRefLoader.py +0 -0
  49. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testChemRefMappingProvider.py +0 -0
  50. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testCitationAdapter.py +0 -0
  51. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testCitationExtractor.py +0 -0
  52. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testCitationUtils.py +0 -0
  53. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testEntryInfoEtlWorkflow.py +0 -0
  54. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testEntryInfoProvider.py +0 -0
  55. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testExDbWorkflow.py +0 -0
  56. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testGlycanEtlWorkflow.py +0 -0
  57. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testGlycanProvider.py +0 -0
  58. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testGlycanUtils.py +0 -0
  59. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testLigandNeighborMappingProvider.py +0 -0
  60. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testObjectExtractor.py +0 -0
  61. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testObjectTransformer.py +0 -0
  62. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testObjectUpdater.py +0 -0
  63. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testPolymerEntityExtractor.py +0 -0
  64. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testPubChemDataCacheProvider.py +0 -0
  65. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testPubChemEtlWorkflow.py +0 -0
  66. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testPubChemEtlWrapper.py +0 -0
  67. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testPubChemIndexCacheProvider.py +0 -0
  68. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testReferenceSequenceAnnotationAdapter.py +0 -0
  69. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testReferenceSequenceAssignmentAdapter.py +0 -0
  70. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testReferenceSequenceAssignmentAdapterValidate.py +0 -0
  71. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testReferenceSequenceAssignmentProvider.py +0 -0
  72. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testReferenceSequenceCacheProvider.py +0 -0
  73. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testTaxonomyExtractor.py +0 -0
  74. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testTreeNodeListWorker.py +0 -0
  75. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testUniProtCoreEtlWorker.py +0 -0
  76. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tests/testUniProtExtractor.py +0 -0
  77. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tree/TreeNodeListWorker.py +0 -0
  78. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/tree/__init__.py +0 -0
  79. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/utils/ObjectAdapterBase.py +0 -0
  80. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/utils/ObjectExtractor.py +0 -0
  81. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/utils/ObjectTransformer.py +0 -0
  82. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/utils/ObjectUpdater.py +0 -0
  83. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/utils/ObjectValidator.py +0 -0
  84. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/utils/__init__.py +0 -0
  85. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/wf/EntryInfoEtlWorkflow.py +0 -0
  86. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/wf/ExDbWorkflow.py +0 -0
  87. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/wf/GlycanEtlWorkflow.py +0 -0
  88. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/wf/PubChemEtlWorkflow.py +0 -0
  89. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb/exdb/wf/__init__.py +0 -0
  90. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb.exdb.egg-info/SOURCES.txt +0 -0
  91. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb.exdb.egg-info/dependency_links.txt +0 -0
  92. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb.exdb.egg-info/entry_points.txt +0 -0
  93. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb.exdb.egg-info/not-zip-safe +0 -0
  94. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/rcsb.exdb.egg-info/top_level.txt +0 -0
  95. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/setup.cfg +0 -0
  96. {rcsb_exdb-1.25 → rcsb_exdb-1.26}/setup.py +0 -0
@@ -106,3 +106,5 @@
106
106
  27-Aug-2024 V1.24 Update tree loading for CARD ontology data
107
107
  22-Oct-2024 V1.25 Add CLI for CCD image and file generation;
108
108
  Update CI/CD to python 3.10
109
+ 10-Dec-2024 V1.26 Update PolymerEntityExtractor to sort extracted sequence data;
110
+ Update Azure pipelines to run on latest macOS and ubuntu version
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: rcsb.exdb
3
- Version: 1.25
3
+ Version: 1.26
4
4
  Summary: RCSB Python ExDB data extraction and loading workflows
5
5
  Home-page: https://github.com/rcsb/py-rcsb_exdb
6
6
  Author: John Westbrook
@@ -28,7 +28,7 @@ Requires-Dist: rcsb.utils.config>=0.40
28
28
  Requires-Dist: rcsb.utils.ec>=0.25
29
29
  Requires-Dist: rcsb.utils.go>=0.18
30
30
  Requires-Dist: rcsb.utils.seq>=0.82
31
- Requires-Dist: rcsb.utils.seqalign>=0.29
31
+ Requires-Dist: rcsb.utils.seqalign>=0.31
32
32
  Requires-Dist: rcsb.utils.targets>=0.82
33
33
  Requires-Dist: rcsb.utils.struct>=0.47
34
34
  Requires-Dist: rcsb.utils.taxonomy>=0.43
@@ -2,4 +2,4 @@ __docformat__ = "google en"
2
2
  __author__ = "John Westbrook"
3
3
  __email__ = "john.westbrook@rcsb.org"
4
4
  __license__ = "Apache 2.0"
5
- __version__ = "1.25"
5
+ __version__ = "1.26"
@@ -7,6 +7,8 @@
7
7
  #
8
8
  # Updates:
9
9
  # 9-Jan-2024 dwp Turn off use of uniprot_exdb DB for enriching protein entity details file (data not used)
10
+ # 10-Dec-2024 dwp Sort extracted polymer entity sequence data by entity ID (alphabetically), to ensure consistent
11
+ # ordering between coasts (order of sequence data influences results of mmseqs2 sequence searching)
10
12
  #
11
13
  ##
12
14
  __docformat__ = "google en"
@@ -16,6 +18,7 @@ __license__ = "Apache 2.0"
16
18
 
17
19
  import logging
18
20
  import os
21
+ from collections import OrderedDict
19
22
 
20
23
  from rcsb.exdb.utils.ObjectExtractor import ObjectExtractor
21
24
  from rcsb.utils.io.MarshalUtil import MarshalUtil
@@ -175,9 +178,12 @@ class PolymerEntityExtractor(object):
175
178
  pass
176
179
  rD[rId] = {"alignmentL": uDL, "sourceOrgL": sL, "partCount": partCount, "taxCount": taxCount, "sequence": seqS, "seqLen": seqLen}
177
180
 
181
+ # Sort the dict in alphabetical order (by entity ID key) to ensure consistent/reproducible treatment by mmseqs2
182
+ sortedD = OrderedDict((k, rD.pop(k)) for k in sorted(rD))
183
+
178
184
  except Exception as e:
179
185
  logger.exception("Failing with %s", str(e))
180
- return rD, missingSrcD
186
+ return sortedD, missingSrcD
181
187
 
182
188
  def __getSourcePart(self, entityId, sourceOrgL, entityBeg, seqLen):
183
189
  """Return the source part containing the input entity range -
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: rcsb.exdb
3
- Version: 1.25
3
+ Version: 1.26
4
4
  Summary: RCSB Python ExDB data extraction and loading workflows
5
5
  Home-page: https://github.com/rcsb/py-rcsb_exdb
6
6
  Author: John Westbrook
@@ -28,7 +28,7 @@ Requires-Dist: rcsb.utils.config>=0.40
28
28
  Requires-Dist: rcsb.utils.ec>=0.25
29
29
  Requires-Dist: rcsb.utils.go>=0.18
30
30
  Requires-Dist: rcsb.utils.seq>=0.82
31
- Requires-Dist: rcsb.utils.seqalign>=0.29
31
+ Requires-Dist: rcsb.utils.seqalign>=0.31
32
32
  Requires-Dist: rcsb.utils.targets>=0.82
33
33
  Requires-Dist: rcsb.utils.struct>=0.47
34
34
  Requires-Dist: rcsb.utils.taxonomy>=0.43
@@ -10,7 +10,7 @@ rcsb.utils.config>=0.40
10
10
  rcsb.utils.ec>=0.25
11
11
  rcsb.utils.go>=0.18
12
12
  rcsb.utils.seq>=0.82
13
- rcsb.utils.seqalign>=0.29
13
+ rcsb.utils.seqalign>=0.31
14
14
  rcsb.utils.targets>=0.82
15
15
  rcsb.utils.struct>=0.47
16
16
  rcsb.utils.taxonomy>=0.43
@@ -11,7 +11,7 @@ rcsb.utils.config >= 0.40
11
11
  rcsb.utils.ec >= 0.25
12
12
  rcsb.utils.go >= 0.18
13
13
  rcsb.utils.seq >= 0.82
14
- rcsb.utils.seqalign >= 0.29
14
+ rcsb.utils.seqalign >= 0.31
15
15
  rcsb.utils.targets >= 0.82
16
16
  rcsb.utils.struct >= 0.47
17
17
  rcsb.utils.taxonomy >= 0.43
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes