dcicutils 8.8.1.1b26__py3-none-any.whl → 8.8.1.1b28__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- dcicutils/portal_object_utils.py +1 -1
- dcicutils/structured_data.py +10 -14
- dcicutils/submitr/ref_lookup_strategy.py +67 -0
- {dcicutils-8.8.1.1b26.dist-info → dcicutils-8.8.1.1b28.dist-info}/METADATA +1 -1
- {dcicutils-8.8.1.1b26.dist-info → dcicutils-8.8.1.1b28.dist-info}/RECORD +8 -7
- {dcicutils-8.8.1.1b26.dist-info → dcicutils-8.8.1.1b28.dist-info}/LICENSE.txt +0 -0
- {dcicutils-8.8.1.1b26.dist-info → dcicutils-8.8.1.1b28.dist-info}/WHEEL +0 -0
- {dcicutils-8.8.1.1b26.dist-info → dcicutils-8.8.1.1b28.dist-info}/entry_points.txt +0 -0
dcicutils/portal_object_utils.py
CHANGED
@@ -195,7 +195,7 @@ class PortalObject:
|
|
195
195
|
# sure we check accession format (since it does not have a pattern).
|
196
196
|
if callable(ref_lookup_strategy):
|
197
197
|
lookup_options, ref_validator = ref_lookup_strategy(
|
198
|
-
self.type, schema, identifying_value)
|
198
|
+
self._portal, self.type, schema, identifying_value)
|
199
199
|
if callable(ref_validator):
|
200
200
|
if ref_validator(schema, identifying_property, identifying_value) is False:
|
201
201
|
continue
|
dcicutils/structured_data.py
CHANGED
@@ -822,7 +822,7 @@ class Portal(PortalBase):
|
|
822
822
|
if callable(ref_lookup_strategy):
|
823
823
|
self._ref_lookup_strategy = ref_lookup_strategy
|
824
824
|
else:
|
825
|
-
self._ref_lookup_strategy = lambda type_name, schema, value: (Portal.LOOKUP_DEFAULT, None)
|
825
|
+
self._ref_lookup_strategy = lambda portal, type_name, schema, value: (Portal.LOOKUP_DEFAULT, None)
|
826
826
|
if ref_lookup_nocache is True:
|
827
827
|
self.ref_lookup = self.ref_lookup_uncached
|
828
828
|
self._ref_cache = None
|
@@ -860,10 +860,6 @@ class Portal(PortalBase):
|
|
860
860
|
@lru_cache(maxsize=100)
|
861
861
|
def get_schema(self, schema_name: str) -> Optional[dict]:
|
862
862
|
return schemas.get(Schema.type_name(schema_name), None) if (schemas := self.get_schemas()) else None
|
863
|
-
# if schema_name == schema_name.upper() and (schema := schemas.get(schema_name.lower().title())):
|
864
|
-
# return schema
|
865
|
-
# if schema_name == schema_name.lower() and (schema := schemas.get(schema_name.title())):
|
866
|
-
# return schema
|
867
863
|
|
868
864
|
@lru_cache(maxsize=1)
|
869
865
|
def get_schemas(self) -> Optional[dict]:
|
@@ -892,7 +888,7 @@ class Portal(PortalBase):
|
|
892
888
|
self._ref_total_count += 1
|
893
889
|
# First make sure the given value can possibly be a reference to the given type.
|
894
890
|
schema = self.get_schema(type_name)
|
895
|
-
|
891
|
+
ref_lookup_flags, ref_validator = self._ref_lookup_strategy(self, type_name, schema, value)
|
896
892
|
if not self._is_valid_ref(type_name, value, ref_validator):
|
897
893
|
if called_from_map_ref:
|
898
894
|
self._ref_invalid_identifying_property_count += 1
|
@@ -922,11 +918,11 @@ class Portal(PortalBase):
|
|
922
918
|
# Get the lookup strategy; i.e. should do we lookup by root path, and if so, should
|
923
919
|
# we do this first, and do we lookup by subtypes; by default we lookup by root path
|
924
920
|
# but not first, and we also lookup by subtypes by default.
|
925
|
-
|
926
|
-
is_ref_lookup_specified_type = StructuredDataSet._is_ref_lookup_specified_type(
|
927
|
-
is_ref_lookup_root = StructuredDataSet._is_ref_lookup_root(
|
928
|
-
is_ref_lookup_root_first = StructuredDataSet._is_ref_lookup_root_first(
|
929
|
-
is_ref_lookup_subtypes = StructuredDataSet._is_ref_lookup_subtypes(
|
921
|
+
ref_lookup_flags, _ = self._ref_lookup_strategy(self, type_name, self.get_schema(type_name), value)
|
922
|
+
is_ref_lookup_specified_type = StructuredDataSet._is_ref_lookup_specified_type(ref_lookup_flags)
|
923
|
+
is_ref_lookup_root = StructuredDataSet._is_ref_lookup_root(ref_lookup_flags)
|
924
|
+
is_ref_lookup_root_first = StructuredDataSet._is_ref_lookup_root_first(ref_lookup_flags)
|
925
|
+
is_ref_lookup_subtypes = StructuredDataSet._is_ref_lookup_subtypes(ref_lookup_flags)
|
930
926
|
# First construct the list of lookup paths at which to look for the referenced item.
|
931
927
|
lookup_paths = []
|
932
928
|
if is_ref_lookup_root_first:
|
@@ -971,9 +967,9 @@ class Portal(PortalBase):
|
|
971
967
|
if not type_name or not value:
|
972
968
|
return None # Should not happen.
|
973
969
|
# Note that root lookup not applicable here.
|
974
|
-
|
975
|
-
self._ref_lookup_strategy(type_name, self.get_schema(type_name), value))
|
976
|
-
is_ref_lookup_subtypes = StructuredDataSet._is_ref_lookup_subtypes(
|
970
|
+
ref_lookup_flags, ref_validator = (
|
971
|
+
self._ref_lookup_strategy(self, type_name, self.get_schema(type_name), value))
|
972
|
+
is_ref_lookup_subtypes = StructuredDataSet._is_ref_lookup_subtypes(ref_lookup_flags)
|
977
973
|
subtype_names = self.get_schema_subtype_names(type_name) if is_ref_lookup_subtypes else []
|
978
974
|
for type_name in [type_name] + subtype_names:
|
979
975
|
is_resolved, resolved_item = self._ref_exists_single_internally(type_name, value)
|
@@ -0,0 +1,67 @@
|
|
1
|
+
import re
|
2
|
+
from typing import Optional
|
3
|
+
from dcicutils.structured_data import Portal
|
4
|
+
|
5
|
+
|
6
|
+
def ref_lookup_strategy(portal: Portal, type_name: str, schema: dict, value: str) -> (int, Optional[str]):
|
7
|
+
#
|
8
|
+
# FYI: Note this situation WRT object lookups ...
|
9
|
+
#
|
10
|
+
# /{submitted_id} # NOT FOUND
|
11
|
+
# /UnalignedReads/{submitted_id} # OK
|
12
|
+
# /SubmittedFile/{submitted_id} # OK
|
13
|
+
# /File/{submitted_id} # NOT FOUND
|
14
|
+
#
|
15
|
+
# /{accession} # OK
|
16
|
+
# /UnalignedReads/{accession} # NOT FOUND
|
17
|
+
# /SubmittedFile/{accession} # NOT FOUND
|
18
|
+
# /File/{accession} # OK
|
19
|
+
#
|
20
|
+
def ref_validator(schema: Optional[dict],
|
21
|
+
property_name: Optional[str], property_value: Optional[str]) -> Optional[bool]:
|
22
|
+
"""
|
23
|
+
Returns False iff the type represented by the given schema, can NOT be referenced by
|
24
|
+
the given property name with the given property value, otherwise returns None.
|
25
|
+
|
26
|
+
For example, if the schema is for the UnalignedReads type and the property name
|
27
|
+
is accession, then we will return False iff the given property value is NOT a properly
|
28
|
+
formatted accession ID. Otherwise, we will return None, which indicates that the
|
29
|
+
caller (in dcicutils.structured_data.Portal.ref_exists) will continue executing
|
30
|
+
its default behavior, which is to check other ways in which the given type can NOT
|
31
|
+
be referenced by the given value, i.e. it checks other identifying properties for
|
32
|
+
the type and makes sure any patterns (e.g. for submitted_id or uuid) are ahered to.
|
33
|
+
|
34
|
+
The goal (in structured_data) being to detect if a type is being referenced in such
|
35
|
+
a way that cannot possibly be allowed, i.e. because none of its identifying types
|
36
|
+
are in the required form (if indeed there any requirements). Note that it is guaranteed
|
37
|
+
that the given property name is indeed an identifying property for the given type.
|
38
|
+
"""
|
39
|
+
if property_format := schema.get("properties", {}).get(property_name, {}).get("format"):
|
40
|
+
if (property_format == "accession") and (property_name == "accession"):
|
41
|
+
if not _is_accession_id(property_value):
|
42
|
+
return False
|
43
|
+
return None
|
44
|
+
|
45
|
+
DEFAULT_RESPONSE = (Portal.LOOKUP_DEFAULT, ref_validator)
|
46
|
+
|
47
|
+
if not value:
|
48
|
+
return DEFAULT_RESPONSE
|
49
|
+
if not schema:
|
50
|
+
if not isinstance(portal, Portal) or not (schema := portal.get_schema(type_name)):
|
51
|
+
return DEFAULT_RESPONSE
|
52
|
+
if schema_properties := schema.get("properties"):
|
53
|
+
if schema_properties.get("accession") and _is_accession_id(value):
|
54
|
+
# Case: lookup by accession (only by root).
|
55
|
+
return Portal.LOOKUP_ROOT, ref_validator
|
56
|
+
elif schema_property_info_submitted_id := schema_properties.get("submitted_id"):
|
57
|
+
if schema_property_pattern_submitted_id := schema_property_info_submitted_id.get("pattern"):
|
58
|
+
if re.match(schema_property_pattern_submitted_id, value):
|
59
|
+
# Case: lookup by submitted_id (only by specified type).
|
60
|
+
return Portal.LOOKUP_SPECIFIED_TYPE, ref_validator
|
61
|
+
return DEFAULT_RESPONSE
|
62
|
+
|
63
|
+
|
64
|
+
# This is here for now because of problems with circular dependencies.
|
65
|
+
# See: smaht-portal/.../schema_formats.py
|
66
|
+
def _is_accession_id(value: str) -> bool:
|
67
|
+
return isinstance(value, str) and re.match(r"^SMA[1-9A-Z]{9}$", value) is not None
|
@@ -46,7 +46,7 @@ dcicutils/log_utils.py,sha256=7pWMc6vyrorUZQf-V-M3YC6zrPgNhuV_fzm9xqTPph0,10883
|
|
46
46
|
dcicutils/misc_utils.py,sha256=zVc4urdVGgnWjQ4UQlrGH-URAzr2l_PwZWI3u_GJdFE,102210
|
47
47
|
dcicutils/obfuscation_utils.py,sha256=fo2jOmDRC6xWpYX49u80bVNisqRRoPskFNX3ymFAmjw,5963
|
48
48
|
dcicutils/opensearch_utils.py,sha256=V2exmFYW8Xl2_pGFixF4I2Cc549Opwe4PhFi5twC0M8,1017
|
49
|
-
dcicutils/portal_object_utils.py,sha256=
|
49
|
+
dcicutils/portal_object_utils.py,sha256=gDXRgPsRvqCFwbC8WatsuflAxNiigOnqr0Hi93k3AgE,15422
|
50
50
|
dcicutils/portal_utils.py,sha256=oBoI3KWRp6YrbsuVGbmPQ3kATB5cVVsQo7-qmnYXWqg,30260
|
51
51
|
dcicutils/project_utils.py,sha256=qPdCaFmWUVBJw4rw342iUytwdQC0P-XKpK4mhyIulMM,31250
|
52
52
|
dcicutils/qa_checkers.py,sha256=cdXjeL0jCDFDLT8VR8Px78aS10hwNISOO5G_Zv2TZ6M,20534
|
@@ -62,16 +62,17 @@ dcicutils/secrets_utils.py,sha256=8dppXAsiHhJzI6NmOcvJV5ldvKkQZzh3Fl-cb8Wm7MI,19
|
|
62
62
|
dcicutils/sheet_utils.py,sha256=VlmzteONW5VF_Q4vo0yA5vesz1ViUah1MZ_yA1rwZ0M,33629
|
63
63
|
dcicutils/snapshot_utils.py,sha256=ymP7PXH6-yEiXAt75w0ldQFciGNqWBClNxC5gfX2FnY,22961
|
64
64
|
dcicutils/ssl_certificate_utils.py,sha256=F0ifz_wnRRN9dfrfsz7aCp4UDLgHEY8LaK7PjnNvrAQ,9707
|
65
|
-
dcicutils/structured_data.py,sha256=
|
65
|
+
dcicutils/structured_data.py,sha256=IjiLOLsxtINOEaz3oVSEscA4lW-t6u9dFfW-NRCRmfs,58451
|
66
66
|
dcicutils/submitr/progress_constants.py,sha256=5bxyX77ql8qEJearfHEvsvXl7D0GuUODW0T65mbRmnE,2895
|
67
|
+
dcicutils/submitr/ref_lookup_strategy.py,sha256=Js2cVznTmgjciLWBPLCvMiwLIHXjDn3jww-gJPjYuFw,3467
|
67
68
|
dcicutils/task_utils.py,sha256=MF8ujmTD6-O2AC2gRGPHyGdUrVKgtr8epT5XU8WtNjk,8082
|
68
69
|
dcicutils/tmpfile_utils.py,sha256=n95XF8dZVbQRSXBZTGToXXfSs3JUVRyN6c3ZZ0nhAWI,1403
|
69
70
|
dcicutils/trace_utils.py,sha256=g8kwV4ebEy5kXW6oOrEAUsurBcCROvwtZqz9fczsGRE,1769
|
70
71
|
dcicutils/validation_utils.py,sha256=cMZIU2cY98FYtzK52z5WUYck7urH6JcqOuz9jkXpqzg,14797
|
71
72
|
dcicutils/variant_utils.py,sha256=2H9azNx3xAj-MySg-uZ2SFqbWs4kZvf61JnK6b-h4Qw,4343
|
72
73
|
dcicutils/zip_utils.py,sha256=rnjNv_k6L9jT2SjDSgVXp4BEJYLtz9XN6Cl2Fy-tqnM,2027
|
73
|
-
dcicutils-8.8.1.
|
74
|
-
dcicutils-8.8.1.
|
75
|
-
dcicutils-8.8.1.
|
76
|
-
dcicutils-8.8.1.
|
77
|
-
dcicutils-8.8.1.
|
74
|
+
dcicutils-8.8.1.1b28.dist-info/LICENSE.txt,sha256=qnwSmfnEWMl5l78VPDEzAmEbLVrRqQvfUQiHT0ehrOo,1102
|
75
|
+
dcicutils-8.8.1.1b28.dist-info/METADATA,sha256=BQjxloCg_4ksew6yyy1O5C9CSZ8VUTQrsqgfq1_K9D4,3357
|
76
|
+
dcicutils-8.8.1.1b28.dist-info/WHEEL,sha256=7Z8_27uaHI_UZAc4Uox4PpBhQ9Y5_modZXWMxtUi4NU,88
|
77
|
+
dcicutils-8.8.1.1b28.dist-info/entry_points.txt,sha256=51Q4F_2V10L0282W7HFjP4jdzW4K8lnWDARJQVFy_hw,270
|
78
|
+
dcicutils-8.8.1.1b28.dist-info/RECORD,,
|
File without changes
|
File without changes
|
File without changes
|