rcsb.exdb 1.33__py3-none-any.whl → 1.34__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -9,6 +9,7 @@
9
9
  # 9-Jan-2024 dwp Turn off use of uniprot_exdb DB for enriching protein entity details file (data not used)
10
10
  # 10-Dec-2024 dwp Sort extracted polymer entity sequence data by entity ID (alphabetically), to ensure consistent
11
11
  # ordering between coasts (order of sequence data influences results of mmseqs2 sequence searching)
12
+ # 2-Feb-2026 dwp Handle case of missing 'rcsb_entity_source_organism.source_type'
12
13
  #
13
14
  ##
14
15
  __docformat__ = "google en"
@@ -115,7 +116,7 @@ class PolymerEntityExtractor(object):
115
116
  begSeqNum = 1
116
117
  endSeqNum = seqLen
117
118
  srcId = tD["pdbx_src_id"]
118
- srcType = tD["source_type"]
119
+ srcType = tD["source_type"] if "source_type" in tD else None
119
120
  taxId = tD["ncbi_taxonomy_id"] if "ncbi_taxonomy_id" in tD else -1
120
121
  if srcName and taxId == -1:
121
122
  missingSrcD.setdefault(srcName, []).append(rId)
@@ -138,7 +139,7 @@ class PolymerEntityExtractor(object):
138
139
  pD = eD["rcsb_polymer_entity"]
139
140
  taxCount = pD["rcsb_source_taxonomy_count"]
140
141
  except Exception:
141
- if srcType == "synthetic":
142
+ if srcType is not None and srcType == "synthetic":
142
143
  taxCount = 0
143
144
  else:
144
145
  logger.warning("%s (srcName %r) no source taxonomy count type %r", rId, srcName, srcType)
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: rcsb.exdb
3
- Version: 1.33
3
+ Version: 1.34
4
4
  Summary: RCSB Python ExDB data extraction and loading workflows
5
5
  Project-URL: Homepage, https://github.com/rcsb/py-rcsb_exdb
6
6
  Author-email: John Westbrook <john.westbrook@rcsb.org>
@@ -33,7 +33,7 @@ rcsb/exdb/examples-seq/testReferenceSequenceUtils.py,sha256=JIpQsyVfU9sx-50ludlD
33
33
  rcsb/exdb/seq/AnnotationExtractor.py,sha256=8iCE8LJR7QH8ilSWDkpKYQSfVuSvorlnM9VHIIYcRoY,2741
34
34
  rcsb/exdb/seq/LigandNeighborMappingExtractor.py,sha256=PpRWunQHZ6j8s6MCu1tuY59cocEoUvM3bIUcsvQ-Ijo,3431
35
35
  rcsb/exdb/seq/LigandNeighborMappingProvider.py,sha256=vzy2tJGB6IgDNgSHyzGU3TuTOV9cfWI_eLRkO3apQtk,3741
36
- rcsb/exdb/seq/PolymerEntityExtractor.py,sha256=YPyK0F90mjHCBc_vqZdAvBcDecAcOHUax4TxGToEzmg,15004
36
+ rcsb/exdb/seq/PolymerEntityExtractor.py,sha256=7Vf50e4aCwBJ_0nMuPrlMLU3dyQMD_T2w-YtoawKInc,15144
37
37
  rcsb/exdb/seq/ReferenceSequenceAnnotationAdapter.py,sha256=VXStOXoZcbFGYOm5eYiqn599BNksG87h3kzK_aQz2Xc,31160
38
38
  rcsb/exdb/seq/ReferenceSequenceAnnotationProvider.py,sha256=2fbNeH1VkxEPpny0lfaTJ-UGEXQjxTdQbUoeiTRbJuU,9560
39
39
  rcsb/exdb/seq/ReferenceSequenceAssignmentAdapter.py,sha256=P-t4w4uvnx4qv_vBAJwKuBGjo6wOIYZ8IKzGaw2bCQ8,25935
@@ -55,7 +55,7 @@ rcsb/exdb/wf/EntryInfoEtlWorkflow.py,sha256=YVr75Wz1BPjLr_satd28B9BeD3QL6HwmkR17
55
55
  rcsb/exdb/wf/GlycanEtlWorkflow.py,sha256=oJ6wf438K2e-eLmy8Ni3MCPxjAKgVJY38SWO885gnmg,2820
56
56
  rcsb/exdb/wf/PubChemEtlWorkflow.py,sha256=fNX3A6kf0S1XiJMz7ywNpFuuua5lT3XaUFjcCJtvQsU,11235
57
57
  rcsb/exdb/wf/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
58
- rcsb_exdb-1.33.dist-info/METADATA,sha256=0_XboU3Pyut6e2JCDds5wE4pPVFJHGoCMnlvOtZckME,3845
59
- rcsb_exdb-1.33.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
60
- rcsb_exdb-1.33.dist-info/licenses/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
61
- rcsb_exdb-1.33.dist-info/RECORD,,
58
+ rcsb_exdb-1.34.dist-info/METADATA,sha256=nfmbDBYh52noNUURQXRnqS8ksTzLd_46fINrsstMmkc,3845
59
+ rcsb_exdb-1.34.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
60
+ rcsb_exdb-1.34.dist-info/licenses/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
61
+ rcsb_exdb-1.34.dist-info/RECORD,,