dcicutils 8.8.1.1b26__py3-none-any.whl → 8.8.1.1b28__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -195,7 +195,7 @@ class PortalObject:
195
195
  # sure we check accession format (since it does not have a pattern).
196
196
  if callable(ref_lookup_strategy):
197
197
  lookup_options, ref_validator = ref_lookup_strategy(
198
- self.type, schema, identifying_value)
198
+ self._portal, self.type, schema, identifying_value)
199
199
  if callable(ref_validator):
200
200
  if ref_validator(schema, identifying_property, identifying_value) is False:
201
201
  continue
@@ -822,7 +822,7 @@ class Portal(PortalBase):
822
822
  if callable(ref_lookup_strategy):
823
823
  self._ref_lookup_strategy = ref_lookup_strategy
824
824
  else:
825
- self._ref_lookup_strategy = lambda type_name, schema, value: (Portal.LOOKUP_DEFAULT, None)
825
+ self._ref_lookup_strategy = lambda portal, type_name, schema, value: (Portal.LOOKUP_DEFAULT, None)
826
826
  if ref_lookup_nocache is True:
827
827
  self.ref_lookup = self.ref_lookup_uncached
828
828
  self._ref_cache = None
@@ -860,10 +860,6 @@ class Portal(PortalBase):
860
860
  @lru_cache(maxsize=100)
861
861
  def get_schema(self, schema_name: str) -> Optional[dict]:
862
862
  return schemas.get(Schema.type_name(schema_name), None) if (schemas := self.get_schemas()) else None
863
- # if schema_name == schema_name.upper() and (schema := schemas.get(schema_name.lower().title())):
864
- # return schema
865
- # if schema_name == schema_name.lower() and (schema := schemas.get(schema_name.title())):
866
- # return schema
867
863
 
868
864
  @lru_cache(maxsize=1)
869
865
  def get_schemas(self) -> Optional[dict]:
@@ -892,7 +888,7 @@ class Portal(PortalBase):
892
888
  self._ref_total_count += 1
893
889
  # First make sure the given value can possibly be a reference to the given type.
894
890
  schema = self.get_schema(type_name)
895
- ref_lookup_strategy, ref_validator = self._ref_lookup_strategy(type_name, schema, value)
891
+ ref_lookup_flags, ref_validator = self._ref_lookup_strategy(self, type_name, schema, value)
896
892
  if not self._is_valid_ref(type_name, value, ref_validator):
897
893
  if called_from_map_ref:
898
894
  self._ref_invalid_identifying_property_count += 1
@@ -922,11 +918,11 @@ class Portal(PortalBase):
922
918
  # Get the lookup strategy; i.e. should do we lookup by root path, and if so, should
923
919
  # we do this first, and do we lookup by subtypes; by default we lookup by root path
924
920
  # but not first, and we also lookup by subtypes by default.
925
- ref_lookup_strategy, _ = self._ref_lookup_strategy(type_name, self.get_schema(type_name), value)
926
- is_ref_lookup_specified_type = StructuredDataSet._is_ref_lookup_specified_type(ref_lookup_strategy)
927
- is_ref_lookup_root = StructuredDataSet._is_ref_lookup_root(ref_lookup_strategy)
928
- is_ref_lookup_root_first = StructuredDataSet._is_ref_lookup_root_first(ref_lookup_strategy)
929
- is_ref_lookup_subtypes = StructuredDataSet._is_ref_lookup_subtypes(ref_lookup_strategy)
921
+ ref_lookup_flags, _ = self._ref_lookup_strategy(self, type_name, self.get_schema(type_name), value)
922
+ is_ref_lookup_specified_type = StructuredDataSet._is_ref_lookup_specified_type(ref_lookup_flags)
923
+ is_ref_lookup_root = StructuredDataSet._is_ref_lookup_root(ref_lookup_flags)
924
+ is_ref_lookup_root_first = StructuredDataSet._is_ref_lookup_root_first(ref_lookup_flags)
925
+ is_ref_lookup_subtypes = StructuredDataSet._is_ref_lookup_subtypes(ref_lookup_flags)
930
926
  # First construct the list of lookup paths at which to look for the referenced item.
931
927
  lookup_paths = []
932
928
  if is_ref_lookup_root_first:
@@ -971,9 +967,9 @@ class Portal(PortalBase):
971
967
  if not type_name or not value:
972
968
  return None # Should not happen.
973
969
  # Note that root lookup not applicable here.
974
- ref_lookup_strategy, ref_validator = (
975
- self._ref_lookup_strategy(type_name, self.get_schema(type_name), value))
976
- is_ref_lookup_subtypes = StructuredDataSet._is_ref_lookup_subtypes(ref_lookup_strategy)
970
+ ref_lookup_flags, ref_validator = (
971
+ self._ref_lookup_strategy(self, type_name, self.get_schema(type_name), value))
972
+ is_ref_lookup_subtypes = StructuredDataSet._is_ref_lookup_subtypes(ref_lookup_flags)
977
973
  subtype_names = self.get_schema_subtype_names(type_name) if is_ref_lookup_subtypes else []
978
974
  for type_name in [type_name] + subtype_names:
979
975
  is_resolved, resolved_item = self._ref_exists_single_internally(type_name, value)
@@ -0,0 +1,67 @@
1
+ import re
2
+ from typing import Optional
3
+ from dcicutils.structured_data import Portal
4
+
5
+
6
+ def ref_lookup_strategy(portal: Portal, type_name: str, schema: dict, value: str) -> (int, Optional[str]):
7
+ #
8
+ # FYI: Note this situation WRT object lookups ...
9
+ #
10
+ # /{submitted_id} # NOT FOUND
11
+ # /UnalignedReads/{submitted_id} # OK
12
+ # /SubmittedFile/{submitted_id} # OK
13
+ # /File/{submitted_id} # NOT FOUND
14
+ #
15
+ # /{accession} # OK
16
+ # /UnalignedReads/{accession} # NOT FOUND
17
+ # /SubmittedFile/{accession} # NOT FOUND
18
+ # /File/{accession} # OK
19
+ #
20
+ def ref_validator(schema: Optional[dict],
21
+ property_name: Optional[str], property_value: Optional[str]) -> Optional[bool]:
22
+ """
23
+ Returns False iff the type represented by the given schema, can NOT be referenced by
24
+ the given property name with the given property value, otherwise returns None.
25
+
26
+ For example, if the schema is for the UnalignedReads type and the property name
27
+ is accession, then we will return False iff the given property value is NOT a properly
28
+ formatted accession ID. Otherwise, we will return None, which indicates that the
29
+ caller (in dcicutils.structured_data.Portal.ref_exists) will continue executing
30
+ its default behavior, which is to check other ways in which the given type can NOT
31
+ be referenced by the given value, i.e. it checks other identifying properties for
32
+ the type and makes sure any patterns (e.g. for submitted_id or uuid) are ahered to.
33
+
34
+ The goal (in structured_data) being to detect if a type is being referenced in such
35
+ a way that cannot possibly be allowed, i.e. because none of its identifying types
36
+ are in the required form (if indeed there any requirements). Note that it is guaranteed
37
+ that the given property name is indeed an identifying property for the given type.
38
+ """
39
+ if property_format := schema.get("properties", {}).get(property_name, {}).get("format"):
40
+ if (property_format == "accession") and (property_name == "accession"):
41
+ if not _is_accession_id(property_value):
42
+ return False
43
+ return None
44
+
45
+ DEFAULT_RESPONSE = (Portal.LOOKUP_DEFAULT, ref_validator)
46
+
47
+ if not value:
48
+ return DEFAULT_RESPONSE
49
+ if not schema:
50
+ if not isinstance(portal, Portal) or not (schema := portal.get_schema(type_name)):
51
+ return DEFAULT_RESPONSE
52
+ if schema_properties := schema.get("properties"):
53
+ if schema_properties.get("accession") and _is_accession_id(value):
54
+ # Case: lookup by accession (only by root).
55
+ return Portal.LOOKUP_ROOT, ref_validator
56
+ elif schema_property_info_submitted_id := schema_properties.get("submitted_id"):
57
+ if schema_property_pattern_submitted_id := schema_property_info_submitted_id.get("pattern"):
58
+ if re.match(schema_property_pattern_submitted_id, value):
59
+ # Case: lookup by submitted_id (only by specified type).
60
+ return Portal.LOOKUP_SPECIFIED_TYPE, ref_validator
61
+ return DEFAULT_RESPONSE
62
+
63
+
64
+ # This is here for now because of problems with circular dependencies.
65
+ # See: smaht-portal/.../schema_formats.py
66
+ def _is_accession_id(value: str) -> bool:
67
+ return isinstance(value, str) and re.match(r"^SMA[1-9A-Z]{9}$", value) is not None
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: dcicutils
3
- Version: 8.8.1.1b26
3
+ Version: 8.8.1.1b28
4
4
  Summary: Utility package for interacting with the 4DN Data Portal and other 4DN resources
5
5
  Home-page: https://github.com/4dn-dcic/utils
6
6
  License: MIT
@@ -46,7 +46,7 @@ dcicutils/log_utils.py,sha256=7pWMc6vyrorUZQf-V-M3YC6zrPgNhuV_fzm9xqTPph0,10883
46
46
  dcicutils/misc_utils.py,sha256=zVc4urdVGgnWjQ4UQlrGH-URAzr2l_PwZWI3u_GJdFE,102210
47
47
  dcicutils/obfuscation_utils.py,sha256=fo2jOmDRC6xWpYX49u80bVNisqRRoPskFNX3ymFAmjw,5963
48
48
  dcicutils/opensearch_utils.py,sha256=V2exmFYW8Xl2_pGFixF4I2Cc549Opwe4PhFi5twC0M8,1017
49
- dcicutils/portal_object_utils.py,sha256=MF6MTZ6yxakZFDjbkTKCsF4q4p11dLDVvT5JBV9m6RQ,15408
49
+ dcicutils/portal_object_utils.py,sha256=gDXRgPsRvqCFwbC8WatsuflAxNiigOnqr0Hi93k3AgE,15422
50
50
  dcicutils/portal_utils.py,sha256=oBoI3KWRp6YrbsuVGbmPQ3kATB5cVVsQo7-qmnYXWqg,30260
51
51
  dcicutils/project_utils.py,sha256=qPdCaFmWUVBJw4rw342iUytwdQC0P-XKpK4mhyIulMM,31250
52
52
  dcicutils/qa_checkers.py,sha256=cdXjeL0jCDFDLT8VR8Px78aS10hwNISOO5G_Zv2TZ6M,20534
@@ -62,16 +62,17 @@ dcicutils/secrets_utils.py,sha256=8dppXAsiHhJzI6NmOcvJV5ldvKkQZzh3Fl-cb8Wm7MI,19
62
62
  dcicutils/sheet_utils.py,sha256=VlmzteONW5VF_Q4vo0yA5vesz1ViUah1MZ_yA1rwZ0M,33629
63
63
  dcicutils/snapshot_utils.py,sha256=ymP7PXH6-yEiXAt75w0ldQFciGNqWBClNxC5gfX2FnY,22961
64
64
  dcicutils/ssl_certificate_utils.py,sha256=F0ifz_wnRRN9dfrfsz7aCp4UDLgHEY8LaK7PjnNvrAQ,9707
65
- dcicutils/structured_data.py,sha256=Tgl4ibUQ0O8N5UHDHzPuGQ6HAcu2LkU64kd4CAoxxgQ,58701
65
+ dcicutils/structured_data.py,sha256=IjiLOLsxtINOEaz3oVSEscA4lW-t6u9dFfW-NRCRmfs,58451
66
66
  dcicutils/submitr/progress_constants.py,sha256=5bxyX77ql8qEJearfHEvsvXl7D0GuUODW0T65mbRmnE,2895
67
+ dcicutils/submitr/ref_lookup_strategy.py,sha256=Js2cVznTmgjciLWBPLCvMiwLIHXjDn3jww-gJPjYuFw,3467
67
68
  dcicutils/task_utils.py,sha256=MF8ujmTD6-O2AC2gRGPHyGdUrVKgtr8epT5XU8WtNjk,8082
68
69
  dcicutils/tmpfile_utils.py,sha256=n95XF8dZVbQRSXBZTGToXXfSs3JUVRyN6c3ZZ0nhAWI,1403
69
70
  dcicutils/trace_utils.py,sha256=g8kwV4ebEy5kXW6oOrEAUsurBcCROvwtZqz9fczsGRE,1769
70
71
  dcicutils/validation_utils.py,sha256=cMZIU2cY98FYtzK52z5WUYck7urH6JcqOuz9jkXpqzg,14797
71
72
  dcicutils/variant_utils.py,sha256=2H9azNx3xAj-MySg-uZ2SFqbWs4kZvf61JnK6b-h4Qw,4343
72
73
  dcicutils/zip_utils.py,sha256=rnjNv_k6L9jT2SjDSgVXp4BEJYLtz9XN6Cl2Fy-tqnM,2027
73
- dcicutils-8.8.1.1b26.dist-info/LICENSE.txt,sha256=qnwSmfnEWMl5l78VPDEzAmEbLVrRqQvfUQiHT0ehrOo,1102
74
- dcicutils-8.8.1.1b26.dist-info/METADATA,sha256=LbyQqC3Nz5MOBkoAMUXNXOOBdYfAfvx1qo9D8dBMj7E,3357
75
- dcicutils-8.8.1.1b26.dist-info/WHEEL,sha256=7Z8_27uaHI_UZAc4Uox4PpBhQ9Y5_modZXWMxtUi4NU,88
76
- dcicutils-8.8.1.1b26.dist-info/entry_points.txt,sha256=51Q4F_2V10L0282W7HFjP4jdzW4K8lnWDARJQVFy_hw,270
77
- dcicutils-8.8.1.1b26.dist-info/RECORD,,
74
+ dcicutils-8.8.1.1b28.dist-info/LICENSE.txt,sha256=qnwSmfnEWMl5l78VPDEzAmEbLVrRqQvfUQiHT0ehrOo,1102
75
+ dcicutils-8.8.1.1b28.dist-info/METADATA,sha256=BQjxloCg_4ksew6yyy1O5C9CSZ8VUTQrsqgfq1_K9D4,3357
76
+ dcicutils-8.8.1.1b28.dist-info/WHEEL,sha256=7Z8_27uaHI_UZAc4Uox4PpBhQ9Y5_modZXWMxtUi4NU,88
77
+ dcicutils-8.8.1.1b28.dist-info/entry_points.txt,sha256=51Q4F_2V10L0282W7HFjP4jdzW4K8lnWDARJQVFy_hw,270
78
+ dcicutils-8.8.1.1b28.dist-info/RECORD,,