dcicutils 8.8.5__py3-none-any.whl → 8.8.6.1b1__py3-none-any.whl

Sign up to get free protection for your applications and to get access to all the features.
dcicutils/ff_utils.py CHANGED
@@ -895,9 +895,12 @@ def _get_es_metadata(uuids, es_client, filters, sources, chunk_size, auth):
895
895
  used to create the generator.
896
896
  Should NOT be used directly
897
897
  """
898
+ def get_es_host_local() -> Optional[str]:
899
+ return os.environ.get("ES_HOST_LOCAL", None)
898
900
  health = get_health_page(key=auth)
899
901
  if es_client is None:
900
- es_url = health['elasticsearch']
902
+ if not (es_url := get_es_host_local()):
903
+ es_url = health['elasticsearch']
901
904
  es_client = es_utils.create_es_client(es_url, use_aws_auth=True)
902
905
  namespace_star = health.get('namespace', '') + '*'
903
906
  # match all given uuids to _id fields
dcicutils/file_utils.py CHANGED
@@ -1,13 +1,23 @@
1
1
  import glob
2
+ import hashlib
3
+ import io
2
4
  import os
3
5
  import pathlib
6
+ from datetime import datetime
7
+ import random
8
+ import string
9
+ from tempfile import gettempdir as get_temporary_directory
4
10
  from typing import List, Optional, Union
11
+ from uuid import uuid4 as uuid
12
+
13
+ HOME_DIRECTORY = str(pathlib.Path().home())
5
14
 
6
15
 
7
16
  def search_for_file(file: str,
8
- location: Union[str, Optional[List[str]]] = None,
17
+ location: Union[str, pathlib.PosixPath, Optional[List[Union[str, pathlib.PosixPath]]]] = None,
9
18
  recursive: bool = False,
10
- single: bool = False) -> Union[List[str], Optional[str]]:
19
+ single: bool = False,
20
+ order: bool = True) -> Union[List[str], Optional[str]]:
11
21
  """
12
22
  Searches for the existence of the given file name, first directly in the given directory or list
13
23
  of directories, if specified, and if not then just in the current (working) directory; if the
@@ -16,43 +26,242 @@ def search_for_file(file: str,
16
26
  first file which is found is returned (as a string), or None if none; if the single flag
17
27
  is False, then all matched files are returned in a list, or an empty list if none.
18
28
  """
19
- if file and isinstance(file, (str, pathlib.PosixPath)):
20
- if os.path.isabs(file):
21
- if os.path.exists(file):
22
- return file if single else [file]
23
- return None if single else []
24
- files_found = []
25
- if not location:
26
- location = ["."]
27
- elif isinstance(location, (str, pathlib.PosixPath)):
28
- location = [location]
29
- elif not isinstance(location, list):
30
- location = []
31
- for directory in location:
32
- if not directory:
29
+ def order_by_fewest_number_of_paths_and_then_alphabetically(paths: List[str]) -> List[str]:
30
+ def order_by(path: str):
31
+ return len(path.split(os.path.sep)), path
32
+ return sorted(paths, key=order_by)
33
+
34
+ if not (file and isinstance(file, (str, pathlib.PosixPath))):
35
+ return None if single is True else []
36
+ if os.path.isabs(file):
37
+ if os.path.exists(file):
38
+ return str(file) if single is True else [str(file)]
39
+ return None if single is True else []
40
+ files_found = []
41
+ if not location:
42
+ location = ["."]
43
+ elif isinstance(location, (str, pathlib.PosixPath)):
44
+ location = [location]
45
+ elif not isinstance(location, list):
46
+ location = []
47
+ location_pruned = []
48
+ for directory in location:
49
+ if not isinstance(directory, str):
50
+ if not isinstance(directory, pathlib.PosixPath):
51
+ continue
52
+ directory = str(directory)
53
+ if not (directory := directory.strip()):
54
+ continue
55
+ if os.path.isfile(directory := os.path.abspath(os.path.normpath(directory))):
56
+ # Actually, allow a file rather than a directory; assume its parent directory was intended.
57
+ if not (directory := os.path.dirname(directory)):
33
58
  continue
34
- if isinstance(directory, (str, pathlib.PosixPath)) and os.path.exists(os.path.join(directory, file)):
35
- file_found = os.path.abspath(os.path.normpath(os.path.join(directory, file)))
36
- if single:
37
- return file_found
38
- if file_found not in files_found:
39
- files_found.append(file_found)
40
- if recursive:
41
- for directory in location:
42
- if not directory:
43
- continue
44
- if not directory.endswith("/**") and not file.startswith("**/"):
45
- path = f"{directory}/**/{file}"
46
- else:
47
- path = f"{directory}/{file}"
48
- files = glob.glob(path, recursive=recursive)
49
- if files:
50
- for file_found in files:
51
- file_found = os.path.abspath(file_found)
52
- if single:
53
- return file_found
54
- if file_found not in files_found:
55
- files_found.append(file_found)
56
- if files_found:
57
- return files_found[0] if single else files_found
58
- return None if single else []
59
+ if directory not in location_pruned:
60
+ location_pruned.append(directory)
61
+ location = location_pruned
62
+ for directory in location:
63
+ if os.path.exists(os.path.join(directory, file)):
64
+ file_found = os.path.abspath(os.path.normpath(os.path.join(directory, file)))
65
+ if single is True:
66
+ return file_found
67
+ if file_found not in files_found:
68
+ files_found.append(file_found)
69
+ if recursive is True:
70
+ for directory in location:
71
+ if not directory.endswith("/**") and not file.startswith("**/"):
72
+ path = f"{directory}/**/{file}"
73
+ else:
74
+ path = f"{directory}/{file}"
75
+ files = glob.glob(path, recursive=True if recursive is True else False)
76
+ if files:
77
+ for file_found in files:
78
+ file_found = os.path.abspath(file_found)
79
+ if single is True:
80
+ return file_found
81
+ if file_found not in files_found:
82
+ files_found.append(file_found)
83
+ if single is True:
84
+ return files_found[0] if files_found else None
85
+ elif order is True:
86
+ return order_by_fewest_number_of_paths_and_then_alphabetically(files_found)
87
+ else:
88
+ return files_found
89
+
90
+
91
def normalize_path(value: Union[str, pathlib.Path], absolute: bool = False, expand_home: Optional[bool] = None) -> str:
    """
    Returns a normalized version of the given path: surrounding whitespace is stripped and
    redundant directory separators and parent references are collapsed (via os.path.normpath).
    If the given value is neither a string nor a pathlib.Path, or is blank, returns an empty string.

    If expand_home is True then a leading home directory indicator (i.e. "~") is expanded to the
    actual home directory. If expand_home is False (and only on POSIX systems) then a path which
    is the home directory, or is within it, is rewritten to start with "~". If expand_home is
    None (the default) then neither is done.

    If absolute is True then the result is converted to an absolute path. Note that this is the
    very last step, so it is applied to whatever the expand_home handling produced.
    """
    if isinstance(value, pathlib.Path):
        value = str(value)
    elif not isinstance(value, str):
        return ""
    path = value.strip()
    if not path:
        return ""
    path = os.path.normpath(path)
    if not path:
        return ""
    if expand_home is True:
        path = os.path.expanduser(path)
    elif (expand_home is False) and (os.name == "posix"):
        home_prefix = HOME_DIRECTORY + os.sep
        if path.startswith(home_prefix):
            path = "~/" + path[len(home_prefix):]
        elif path == HOME_DIRECTORY:
            path = "~"
    return os.path.abspath(path) if absolute is True else path
117
+
118
+
119
def get_file_size(file: str, raise_exception: bool = True) -> Optional[int]:
    """
    Returns the size in bytes of the given file (path). If the given file is not a string
    then returns None. If the size cannot be obtained (e.g. the file does not exist) then
    the underlying exception is raised, unless raise_exception is not True, in which case
    None is returned.
    """
    if not isinstance(file, str):
        return None
    try:
        return os.path.getsize(file)
    except Exception:
        if raise_exception is True:
            raise
        return None
126
+
127
+
128
def get_file_modified_datetime(file: str, raise_exception: bool = True) -> Optional[datetime]:
    """
    Returns the last-modified time of the given file (path) as a datetime, as converted by
    datetime.fromtimestamp (i.e. a naive datetime in local time). If the given file is not a
    string then returns None. If the time cannot be obtained (e.g. the file does not exist)
    then the underlying exception is raised, unless raise_exception is not True, in which
    case None is returned.
    """
    if not isinstance(file, str):
        return None
    try:
        modified_timestamp = os.path.getmtime(file)
        return datetime.fromtimestamp(modified_timestamp)
    except Exception:
        if raise_exception is True:
            raise
        return None
135
+
136
+
137
def are_files_equal(filea: str, fileb: str, raise_exception: bool = True) -> bool:
    """
    Returns True iff the contents of the two given files are exactly the same. The files
    are compared in fixed-size binary chunks, so neither is read into memory as a whole.
    If either file cannot be opened or read then the underlying exception is raised,
    unless raise_exception is not True, in which case False is returned.
    """
    block_size = 4096
    try:
        with open(filea, "rb") as stream_a, open(fileb, "rb") as stream_b:
            while True:
                block_a = stream_a.read(block_size)
                block_b = stream_b.read(block_size)
                if block_a != block_b:
                    return False
                if not block_a:
                    # Both streams are exhausted (the blocks are equal and empty).
                    return True
    except Exception:
        if raise_exception is True:
            raise
        return False
157
+
158
+
159
def compute_file_md5(file: str, raise_exception: bool = True) -> str:
    """
    Returns the md5 checksum (as a hex string) of the contents of the given file (path).
    If the given file is not a string then returns an empty string. If the file cannot be
    opened or read then the underlying exception is raised, unless raise_exception is not
    True, in which case an empty string is returned.
    """
    if not isinstance(file, str):
        return ""
    try:
        digest = hashlib.md5()
        with open(file, "rb") as stream:
            # Hash in small blocks so that large files need not fit in memory.
            while block := stream.read(4096):
                digest.update(block)
        return digest.hexdigest()
    except Exception:
        if raise_exception is True:
            raise
        return ""
175
+
176
+
177
def compute_file_etag(file: str, raise_exception: bool = True) -> Optional[str]:
    """
    Returns the AWS S3 "etag" for the given file; this value is md5-like but not the
    same as a normal md5. We use this to check that a file in S3 appears to be exactly
    the same file as a local file. If the file cannot be opened or read then the underlying
    exception is raised, unless raise_exception is not True, in which case None is returned.
    """
    try:
        with io.open(file, "rb") as stream:
            etag = _compute_file_etag(stream)
    except Exception:
        if raise_exception is not True:
            return None
        raise
    return etag
190
+
191
+
192
+ def _compute_file_etag(f: io.BufferedReader) -> str:
193
+ # See: https://stackoverflow.com/questions/75723647/calculate-md5-from-aws-s3-etag
194
+ MULTIPART_THRESHOLD = 8388608
195
+ MULTIPART_CHUNKSIZE = 8388608
196
+ # BUFFER_SIZE = 1048576
197
+ # Verify some assumptions are correct
198
+ # assert(MULTIPART_CHUNKSIZE >= MULTIPART_THRESHOLD)
199
+ # assert((MULTIPART_THRESHOLD % BUFFER_SIZE) == 0)
200
+ # assert((MULTIPART_CHUNKSIZE % BUFFER_SIZE) == 0)
201
+ hash = hashlib.md5()
202
+ read = 0
203
+ chunks = None
204
+ while True:
205
+ # Read some from stdin, if we're at the end, stop reading
206
+ bits = f.read(1048576)
207
+ if len(bits) == 0:
208
+ break
209
+ read += len(bits)
210
+ hash.update(bits)
211
+ if chunks is None:
212
+ # We're handling a multi-part upload, so switch to calculating
213
+ # hashes of each chunk
214
+ if read >= MULTIPART_THRESHOLD:
215
+ chunks = b''
216
+ if chunks is not None:
217
+ if (read % MULTIPART_CHUNKSIZE) == 0:
218
+ # Dont with a chunk, add it to the list of hashes to hash later
219
+ chunks += hash.digest()
220
+ hash = hashlib.md5()
221
+ if chunks is None:
222
+ # Normal upload, just output the MD5 hash
223
+ etag = hash.hexdigest()
224
+ else:
225
+ # Multipart upload, need to output the hash of the hashes
226
+ if (read % MULTIPART_CHUNKSIZE) != 0:
227
+ # Add the last part if we have a partial chunk
228
+ chunks += hash.digest()
229
+ etag = hashlib.md5(chunks).hexdigest() + "-" + str(len(chunks) // 16)
230
+ return etag
231
+
232
+
233
def create_random_file(file: Optional[str] = None, prefix: Optional[str] = None, suffix: Optional[str] = None,
                       nbytes: int = 1024, binary: bool = False, line_length: Optional[int] = None) -> str:
    """
    Writes some random content to the given file (name/path). If the given file is None (or
    empty) then writes to a newly named file in the system temporary directory; in this case
    the given prefix and suffix, if any, are used as the start and end of the generated file
    name. In either case, returns the path of the file written to. The number of bytes written
    is 1024 by default but can be specified with the nbytes argument; defaults to writing ASCII
    text (letters and digits) but if the binary argument is True then writes arbitrary binary
    data; if not binary the content is in lines of 80 characters each (plus newline); use the
    line_length argument in this case to change the line length.
    """
    from datetime import timezone  # Local import; only needed for the generated file name.
    if not isinstance(nbytes, int) or nbytes < 0:
        nbytes = 0
    if not isinstance(file, str) or not file:
        if not isinstance(prefix, str):
            prefix = ""
        if not isinstance(suffix, str):
            suffix = ""
        # Timestamp plus uuid makes for a name which is sortable and, practically, unique.
        timestamp = datetime.now(timezone.utc).strftime("%Y%m%d%H%M%S")
        file = os.path.join(get_temporary_directory(), f"{prefix}{timestamp}{uuid().hex}{suffix}")
    with open(file, "wb" if binary is True else "w") as f:
        if binary is True:
            f.write(os.urandom(nbytes))
        else:
            if (not isinstance(line_length, int)) or (line_length < 1):
                line_length = 80
            alphabet = string.ascii_letters + string.digits
            # Each full line costs its characters plus one for the trailing newline.
            line_size = line_length + 1
            nlines, nremainder = divmod(nbytes, line_size)
            for _ in range(nlines):
                f.write("".join(random.choices(alphabet, k=line_length)))
                f.write("\n")
            # The final, short line: its last byte (if any) is the newline.
            if nremainder > 1:
                f.write("".join(random.choices(alphabet, k=nremainder - 1)))
            if nremainder > 0:
                f.write("\n")
    return file
@@ -0,0 +1,39 @@
1
+ from contextlib import contextmanager
2
+ import requests
3
+ from typing import Callable, Optional
4
+ from dcicutils.tmpfile_utils import temporary_file
5
+
6
+
7
@contextmanager
def download(url: str, suffix: Optional[str] = None, binary: bool = True,
             progress: Optional[Callable] = None) -> Optional[str]:
    """
    Context manager which downloads the given URL into a temporary file and yields the path
    of that file; the temporary file is managed by the temporary_file context manager, within
    which the download and the yield both happen. An optional suffix may be given for the
    temporary file name. The binary and progress arguments are passed through to download_to;
    binary file mode is the default, pass False as the binary argument if that is not desired.
    """
    with temporary_file(suffix=suffix) as downloaded_file:
        download_to(url, downloaded_file, binary=binary, progress=progress)
        yield downloaded_file
18
+
19
+
20
def download_to(url: str, file: str, binary: bool = True, progress: Optional[Callable] = None) -> None:
    """
    Downloads the given URL into the given file. Defaults to binary file mode; if not
    desired then pass False as the binary argument, in which case the downloaded bytes are
    decoded to text using the encoding of the response (or UTF-8 if that is unknown).

    If the given progress argument is a callable then it is called after each chunk written,
    with the number of bytes downloaded so far, and the total number of bytes expected as
    given by the Content-Length response header (or None if that is absent or not numeric).
    """
    import codecs  # Local import; only needed for text (non-binary) mode.
    if not callable(progress):
        progress = None
    nbytes = 0
    nbytes_total = None
    # Use the response as a context manager so the streamed connection is always released.
    with requests.get(url, stream=True) as response:
        if progress:
            if isinstance(content_length := response.headers.get("Content-Length"), str) and content_length.isdigit():
                nbytes_total = int(content_length)
        decoder = None
        if binary is not True:
            # The chunks from iter_content are bytes, which cannot be written to a file opened
            # in text mode; decode incrementally so that a multi-byte character which happens
            # to be split across two chunks is still decoded properly.
            try:
                decoder_class = codecs.getincrementaldecoder(response.encoding or "utf-8")
            except LookupError:
                decoder_class = codecs.getincrementaldecoder("utf-8")
            decoder = decoder_class(errors="replace")
        with open(file, "wb" if binary is True else "w") as f:
            for chunk in response.iter_content(chunk_size=8192):
                if chunk:
                    f.write(decoder.decode(chunk) if decoder else chunk)
                    if progress:
                        nbytes += len(chunk)
                        progress(nbytes, nbytes_total)
            if decoder and (remainder := decoder.decode(b"", final=True)):
                # Flush whatever the decoder was still holding on to.
                f.write(remainder)
dcicutils/misc_utils.py CHANGED
@@ -3,6 +3,7 @@ This file contains functions that might be generally useful.
3
3
  """
4
4
 
5
5
  from collections import namedtuple
6
+ import appdirs
6
7
  import contextlib
7
8
  import datetime
8
9
  import functools
@@ -13,10 +14,12 @@ import json
13
14
  import logging
14
15
  import math
15
16
  import os
17
+ import platform
16
18
  import pytz
17
19
  import re
18
20
  import rfc3986.validators
19
21
  import rfc3986.exceptions
22
+ import shortuuid
20
23
  import time
21
24
  import uuid
22
25
  import warnings
@@ -1152,7 +1155,8 @@ def remove_suffix(suffix: str, text: str, required: bool = False):
1152
1155
 
1153
1156
  def remove_empty_properties(data: Optional[Union[list, dict]],
1154
1157
  isempty: Optional[Callable] = None,
1155
- isempty_array_element: Optional[Callable] = None) -> None:
1158
+ isempty_array_element: Optional[Callable] = None,
1159
+ raise_exception_on_nonempty_array_element_after_empty: bool = False) -> None:
1156
1160
  def _isempty(value: Any) -> bool: # noqa
1157
1161
  return isempty(value) if callable(isempty) else value in [None, "", {}, []]
1158
1162
  if isinstance(data, dict):
@@ -1160,11 +1164,22 @@ def remove_empty_properties(data: Optional[Union[list, dict]],
1160
1164
  if _isempty(value := data[key]):
1161
1165
  del data[key]
1162
1166
  else:
1163
- remove_empty_properties(value, isempty=isempty, isempty_array_element=isempty_array_element)
1167
+ remove_empty_properties(value, isempty=isempty, isempty_array_element=isempty_array_element,
1168
+ raise_exception_on_nonempty_array_element_after_empty= # noqa
1169
+ raise_exception_on_nonempty_array_element_after_empty)
1164
1170
  elif isinstance(data, list):
1165
1171
  for item in data:
1166
- remove_empty_properties(item, isempty=isempty, isempty_array_element=isempty_array_element)
1172
+ remove_empty_properties(item, isempty=isempty, isempty_array_element=isempty_array_element,
1173
+ raise_exception_on_nonempty_array_element_after_empty= # noqa
1174
+ raise_exception_on_nonempty_array_element_after_empty)
1167
1175
  if callable(isempty_array_element):
1176
+ if raise_exception_on_nonempty_array_element_after_empty is True:
1177
+ empty_element_seen = False
1178
+ for item in data:
1179
+ if not empty_element_seen and isempty_array_element(item):
1180
+ empty_element_seen = True
1181
+ elif empty_element_seen and not isempty_array_element(item):
1182
+ raise Exception("Non-empty element found after empty element.")
1168
1183
  data[:] = [item for item in data if not isempty_array_element(item)]
1169
1184
 
1170
1185
 
@@ -1522,7 +1537,7 @@ def right_trim(list_or_tuple: Union[List[Any], Tuple[Any]],
1522
1537
def create_dict(**kwargs) -> dict:
    """
    Returns a dictionary of the given keyword arguments, leaving out any whose value is None;
    other "falsy" values (e.g. 0, False, empty string, empty list) are kept.
    """
    return {name: value for name, value in kwargs.items() if value is not None}
1528
1543
 
@@ -2548,6 +2563,19 @@ def normalize_spaces(value: str) -> str:
2548
2563
  return re.sub(r"\s+", " ", value).strip()
2549
2564
 
2550
2565
 
2566
def normalize_string(value: Optional[str]) -> Optional[str]:
    """
    Returns the given string value with each run of whitespace replaced by a single space
    and with leading/trailing whitespace removed. If the given value is None then returns
    an empty string. If the given value is anything else which is not a string, returns None.
    """
    if value is None:
        return ""
    if not isinstance(value, str):
        return None
    collapsed = re.sub(r"\s+", " ", value)
    return collapsed.strip()
2577
+
2578
+
2551
2579
  def find_nth_from_end(string: str, substring: str, nth: int) -> int:
2552
2580
  """
2553
2581
  Returns the index of the nth occurrence of the given substring within
@@ -2590,7 +2618,11 @@ def format_size(nbytes: Union[int, float], precision: int = 2, nospace: bool = F
2590
2618
  nbytes = int(nbytes)
2591
2619
  return f"{nbytes} byte{'s' if nbytes != 1 else ''}"
2592
2620
  unit = (UNITS_TERSE if terse else UNITS)[index]
2593
- return f"{nbytes:.{precision}f}{'' if nospace else ' '}{unit}"
2621
+ size = f"{nbytes:.{precision}f}"
2622
+ if size.endswith(f".{'0' * precision}"):
2623
+ # Tidy up extraneous zeros.
2624
+ size = size[:-(precision - 1)]
2625
+ return f"{size}{'' if nospace else ' '}{unit}"
2594
2626
 
2595
2627
 
2596
2628
  def format_duration(seconds: Union[int, float]) -> str:
@@ -2670,3 +2702,48 @@ class JsonLinesReader:
2670
2702
  yield line
2671
2703
  else:
2672
2704
  raise Exception(f"If the first line is not a list, all lines must be dictionaries: {line!r}")
2705
+
2706
+
2707
def get_app_specific_directory() -> str:
    """
    Returns the standard system application specific directory, as given by appdirs.user_data_dir:
    - On MacOS this directory is: ~/Library/Application Support
    - On Linux this directory is: ~/.local/share
    - On Windows this directory is: %USERPROFILE%\\AppData\\Local
    N.B. This has been tested on MacOS and Linux but not on Windows.
    """
    directory = appdirs.user_data_dir()
    return directory
2716
+
2717
+
2718
def get_os_name() -> str:
    """
    Returns a short lowercase name for the operating system this is running on, based on
    platform.system: "osx" for Darwin, "linux" for Linux, "windows" for Windows; returns
    an empty string for anything else (or if the system cannot be determined).
    """
    names_by_system = {"Darwin": "osx", "Linux": "linux", "Windows": "windows"}
    return names_by_system.get(platform.system(), "")
2724
+
2725
+
2726
def get_cpu_architecture_name() -> str:
    """
    Returns the name of the machine (CPU) architecture this is running on, as given by
    platform.machine, except that "x86_64" is reported as "amd64"; returns an empty
    string if the architecture cannot be determined.
    """
    machine = platform.machine()
    if not machine:
        return ""
    return "amd64" if machine == "x86_64" else machine
2731
+
2732
+
2733
def create_uuid(nodash: bool = False, upper: bool = False) -> str:
    """
    Returns a new random (version 4) uuid as a string. If the nodash argument is True
    then the dashes are left out; if the upper argument is True then the result is
    uppercase (it is lowercase by default).
    """
    identifier = uuid.uuid4()
    # The hex attribute of a UUID is its string form without the dashes.
    text = identifier.hex if nodash is True else str(identifier)
    return text.upper() if upper is True else text
2740
+
2741
+
2742
def create_short_uuid(length: Optional[int] = None, upper: bool = False):
    """
    Returns a random string of the given length (default 16) as generated by
    shortuuid.ShortUUID().random; a length which is not an integer, or is less than one,
    is taken as the default. If the upper argument is True then the result is uppercased.
    """
    # Not really technically a uuid of course.
    if not isinstance(length, int) or length < 1:
        length = 16
    short_id = shortuuid.ShortUUID().random(length=length)
    return short_id.upper() if upper is True else short_id
dcicutils/portal_utils.py CHANGED
@@ -1,5 +1,6 @@
1
1
  from collections import deque
2
2
  from functools import lru_cache
3
+ from dcicutils.function_cache_decorator import function_cache
3
4
  import io
4
5
  import json
5
6
  from pyramid.config import Configurator as PyramidConfigurator
@@ -18,6 +19,7 @@ from wsgiref.simple_server import make_server as wsgi_make_server
18
19
  from dcicutils.common import APP_SMAHT, OrchestratedApp, ORCHESTRATED_APPS
19
20
  from dcicutils.ff_utils import get_metadata, get_schema, patch_metadata, post_metadata
20
21
  from dcicutils.misc_utils import to_camel_case, VirtualApp
22
+ from dcicutils.schema_utils import get_identifying_properties
21
23
  from dcicutils.tmpfile_utils import temporary_file
22
24
 
23
25
  Portal = Type["Portal"] # Forward type reference for type hints.
@@ -441,6 +443,54 @@ class Portal:
441
443
  result_kwargs["timeout"] = timeout
442
444
  return result_kwargs
443
445
 
446
@function_cache(maxsize=100, serialize_key=True)
def get_identifying_paths(self, portal_object: dict, portal_type: Optional[str] = None) -> List[str]:
    """
    Returns the list of the identifying Portal (URL) paths for the given Portal object. The
    paths are in the order of the identifying property names as returned, for the type of
    the object, by self.get_identifying_property_names. A uuid property yields a path of
    just the uuid; any other property yields a path of the type followed by the value, with
    a list valued property yielding one such path per item. If the given portal_type is not
    a non-empty string then the type is obtained from the object via self.get_schema_type.
    Returns an empty list if the given object is not a dictionary, if its type cannot be
    determined, or if it has no values for any identifying properties.
    """
    if not isinstance(portal_object, dict):
        return []
    if not (isinstance(portal_type, str) and portal_type):
        portal_type = self.get_schema_type(portal_object)
        if not portal_type:
            return []
    paths = []
    for property_name in self.get_identifying_property_names(portal_type):
        property_value = portal_object.get(property_name)
        if not property_value:
            continue
        if isinstance(property_value, list):
            paths.extend(f"/{portal_type}/{item}" for item in property_value)
        elif property_name == "uuid":
            paths.append(f"/{property_value}")
        else:
            paths.append(f"/{portal_type}/{property_value}")
    return paths
469
+
470
@function_cache(maxsize=100, serialize_key=True)
def get_identifying_property_names(self, schema: Union[str, dict]) -> List[str]:
    """
    Returns the list of identifying property names for the given Portal schema, which may be
    either a schema name or a schema object. If present, "uuid" is placed first, followed by
    "identifier"; the others keep the order given by get_identifying_properties. Returns an
    empty list if the schema is neither a string nor a dictionary, if it cannot be found
    (including any exception while getting it), or if it has no identifying properties.
    """
    if isinstance(schema, str):
        try:
            schema = self.get_schema(schema)
        except Exception:
            return []
        if not schema:
            return []
    elif not isinstance(schema, dict):
        return []
    found_properties = get_identifying_properties(schema)
    if not found_properties:
        return []
    # Work on a copy so that whatever was handed back to us is left untouched.
    ordered_properties = list(found_properties)
    # Move the favored names to the front, least favored first, so most favored ends up first.
    for favored_property in ("identifier", "uuid"):
        if favored_property in ordered_properties:
            ordered_properties.remove(favored_property)
            ordered_properties.insert(0, favored_property)
    return ordered_properties
493
+
444
494
  @staticmethod
445
495
  def _default_keys_file(app: Optional[str], env: Optional[str], server: Optional[str]) -> Optional[str]:
446
496
  def infer_app_from_env(env: str) -> Optional[str]: # noqa
@@ -57,6 +57,7 @@
57
57
 
58
58
  import argparse
59
59
  from functools import lru_cache
60
+ import io
60
61
  import json
61
62
  import pyperclip
62
63
  import os
@@ -97,11 +98,18 @@ def main():
97
98
  help="Include all properties for schema usage.")
98
99
  parser.add_argument("--raw", action="store_true", required=False, default=False, help="Raw output.")
99
100
  parser.add_argument("--tree", action="store_true", required=False, default=False, help="Tree output for schemas.")
101
+ parser.add_argument("--post", type=str, required=False, default=None,
102
+ help="POST data of the main arg type with data from file specified with this option.")
103
+ parser.add_argument("--patch", type=str, required=False, default=None,
104
+ help="PATCH data of the main arg type with data from file specified with this option.")
100
105
  parser.add_argument("--database", action="store_true", required=False, default=False,
101
106
  help="Read from database output.")
107
+ parser.add_argument("--bool", action="store_true", required=False,
108
+ default=False, help="Only return whether found or not.")
102
109
  parser.add_argument("--yaml", action="store_true", required=False, default=False, help="YAML output.")
103
110
  parser.add_argument("--copy", "-c", action="store_true", required=False, default=False,
104
111
  help="Copy object data to clipboard.")
112
+ parser.add_argument("--indent", required=False, default=False, help="Indent output.", type=int)
105
113
  parser.add_argument("--details", action="store_true", required=False, default=False, help="Detailed output.")
106
114
  parser.add_argument("--more-details", action="store_true", required=False, default=False,
107
115
  help="More detailed output.")
@@ -151,6 +159,18 @@ def main():
151
159
  args.schema = True
152
160
 
153
161
  if args.schema:
162
+ if args.post:
163
+ if post_data := _read_json_from_file(args.post):
164
+ if args.verbose:
165
+ _print(f"POSTing data from file ({args.post}) as type: {args.uuid}")
166
+ if isinstance(post_data, dict):
167
+ post_data = [post_data]
168
+ elif not isinstance(post_data, list):
169
+ _print(f"POST data neither list nor dictionary: {args.post}")
170
+ for item in post_data:
171
+ portal.post_metadata(args.uuid, item)
172
+ if args.verbose:
173
+ _print(f"Done POSTing data from file ({args.post}) as type: {args.uuid}")
154
174
  schema, schema_name = _get_schema(portal, args.uuid)
155
175
  if schema:
156
176
  if args.copy:
@@ -166,14 +186,50 @@ def main():
166
186
  _print_schema(schema, details=args.details, more_details=args.details,
167
187
  all=args.all, raw=args.raw, raw_yaml=args.yaml)
168
188
  return
169
-
170
- data = _get_portal_object(portal=portal, uuid=args.uuid, raw=args.raw, database=args.database, verbose=args.verbose)
189
+ elif args.patch:
190
+ if patch_data := _read_json_from_file(args.patch):
191
+ if args.verbose:
192
+ _print(f"PATCHing data from file ({args.patch}) for object: {args.uuid}")
193
+ if isinstance(patch_data, dict):
194
+ patch_data = [patch_data]
195
+ elif not isinstance(patch_data, list):
196
+ _print(f"PATCH data neither list nor dictionary: {args.patch}")
197
+ for item in patch_data:
198
+ portal.patch_metadata(args.uuid, item)
199
+ if args.verbose:
200
+ _print(f"Done PATCHing data from file ({args.patch}) as type: {args.uuid}")
201
+ return
202
+ else:
203
+ _print(f"No PATCH data found in file: {args.patch}")
204
+ exit(1)
205
+
206
+ data = _get_portal_object(portal=portal, uuid=args.uuid, raw=args.raw,
207
+ database=args.database, check=args.bool, verbose=args.verbose)
208
+ if args.bool:
209
+ if data:
210
+ _print(f"{args.uuid}: found")
211
+ exit(0)
212
+ else:
213
+ _print(f"{args.uuid}: not found")
214
+ exit(1)
171
215
  if args.copy:
172
216
  pyperclip.copy(json.dumps(data, indent=4))
173
217
  if args.yaml:
174
218
  _print(yaml.dump(data))
175
219
  else:
176
- _print(json.dumps(data, default=str, indent=4))
220
+ if args.indent > 0:
221
+ _print(_format_json_with_indent(data, indent=args.indent))
222
+ else:
223
+ _print(json.dumps(data, default=str, indent=4))
224
+
225
+
226
+ def _format_json_with_indent(value: dict, indent: int = 0) -> Optional[str]:
227
+ if isinstance(value, dict):
228
+ result = json.dumps(value, indent=4)
229
+ if indent > 0:
230
+ result = f"{indent * ' '}{result}"
231
+ result = result.replace("\n", f"\n{indent * ' '}")
232
+ return result
177
233
 
178
234
 
179
235
  def _create_portal(ini: str, env: Optional[str] = None,
@@ -198,7 +254,8 @@ def _create_portal(ini: str, env: Optional[str] = None,
198
254
 
199
255
 
200
256
  def _get_portal_object(portal: Portal, uuid: str,
201
- raw: bool = False, database: bool = False, verbose: bool = False) -> dict:
257
+ raw: bool = False, database: bool = False,
258
+ check: bool = False, verbose: bool = False) -> dict:
202
259
  response = None
203
260
  try:
204
261
  if not uuid.startswith("/"):
@@ -212,13 +269,18 @@ def _get_portal_object(portal: Portal, uuid: str,
212
269
  _exit()
213
270
  _exit(f"Exception getting Portal object from {portal.server}: {uuid}\n{get_error_message(e)}")
214
271
  if not response:
272
+ if check:
273
+ return None
215
274
  _exit(f"Null response getting Portal object from {portal.server}: {uuid}")
216
275
  if response.status_code not in [200, 307]:
217
276
  # TODO: Understand why the /me endpoint returns HTTP status code 307, which is only why we mention it above.
218
277
  _exit(f"Invalid status code ({response.status_code}) getting Portal object from {portal.server}: {uuid}")
219
278
  if not response.json:
220
279
  _exit(f"Invalid JSON getting Portal object: {uuid}")
221
- return response.json()
280
+ response = response.json()
281
+ if raw:
282
+ response.pop("schema_version", None)
283
+ return response
222
284
 
223
285
 
224
286
  @lru_cache(maxsize=1)
@@ -257,6 +319,7 @@ def _print_schema_info(schema: dict, level: int = 0,
257
319
  required: Optional[List[str]] = None) -> None:
258
320
  if not schema or not isinstance(schema, dict):
259
321
  return
322
+ identifying_properties = schema.get("identifyingProperties")
260
323
  if level == 0:
261
324
  if required_properties := schema.get("required"):
262
325
  _print("- required properties:")
@@ -383,6 +446,8 @@ def _print_schema_info(schema: dict, level: int = 0,
383
446
  suffix += f" | enum"
384
447
  if property_required:
385
448
  suffix += f" | required"
449
+ if property_name in (identifying_properties or []):
450
+ suffix += f" | identifying"
386
451
  if property.get("uniqueKey"):
387
452
  suffix += f" | unique"
388
453
  if pattern := property.get("pattern"):
@@ -529,6 +594,23 @@ def _print_tree(root_name: Optional[str],
529
594
  print(line)
530
595
 
531
596
 
597
+ def _read_json_from_file(file: str) -> Optional[dict]:
598
+ if not os.path.exists(file):
599
+ _print(f"Cannot find file: {file}")
600
+ exit(1)
601
+ try:
602
+ with io.open(file, "r") as f:
603
+ try:
604
+ return json.load(f)
605
+ except Exception:
606
+ _print(f"Cannot parse JSON in file: {file}")
607
+ exit(1)
608
+ except Exception as e:
609
+ print(e)
610
+ _print(f"Cannot open file: {file}")
611
+ exit(1)
612
+
613
+
532
614
  def _print(*args, **kwargs):
533
615
  with uncaptured_output():
534
616
  PRINT(*args, **kwargs)
@@ -53,9 +53,10 @@ class StructuredDataSet:
53
53
  def __init__(self, file: Optional[str] = None, portal: Optional[Union[VirtualApp, TestApp, Portal]] = None,
54
54
  schemas: Optional[List[dict]] = None, autoadd: Optional[dict] = None,
55
55
  order: Optional[List[str]] = None, prune: bool = True,
56
+ remove_empty_objects_from_lists: bool = True,
56
57
  ref_lookup_strategy: Optional[Callable] = None,
57
58
  ref_lookup_nocache: bool = False,
58
- norefs: bool = False,
59
+ norefs: bool = False, merge: bool = False,
59
60
  progress: Optional[Callable] = None,
60
61
  debug_sleep: Optional[str] = None) -> None:
61
62
  self._progress = progress if callable(progress) else None
@@ -65,7 +66,8 @@ class StructuredDataSet:
65
66
  ref_lookup_nocache=ref_lookup_nocache) if portal else None
66
67
  self._ref_lookup_strategy = ref_lookup_strategy
67
68
  self._order = order
68
- self._prune = prune
69
+ self._prune = prune is True
70
+ self._remove_empty_objects_from_lists = remove_empty_objects_from_lists is True
69
71
  self._warnings = {}
70
72
  self._errors = {}
71
73
  self._resolved_refs = set()
@@ -73,6 +75,7 @@ class StructuredDataSet:
73
75
  self._nrows = 0
74
76
  self._autoadd_properties = autoadd if isinstance(autoadd, dict) and autoadd else None
75
77
  self._norefs = True if norefs is True else False
78
+ self._merge = True if merge is True else False
76
79
  self._debug_sleep = None
77
80
  if debug_sleep:
78
81
  try:
@@ -93,14 +96,16 @@ class StructuredDataSet:
93
96
  def load(file: str, portal: Optional[Union[VirtualApp, TestApp, Portal]] = None,
94
97
  schemas: Optional[List[dict]] = None, autoadd: Optional[dict] = None,
95
98
  order: Optional[List[str]] = None, prune: bool = True,
99
+ remove_empty_objects_from_lists: bool = True,
96
100
  ref_lookup_strategy: Optional[Callable] = None,
97
101
  ref_lookup_nocache: bool = False,
98
- norefs: bool = False,
102
+ norefs: bool = False, merge: bool = False,
99
103
  progress: Optional[Callable] = None,
100
104
  debug_sleep: Optional[str] = None) -> StructuredDataSet:
101
105
  return StructuredDataSet(file=file, portal=portal, schemas=schemas, autoadd=autoadd, order=order, prune=prune,
106
+ remove_empty_objects_from_lists=remove_empty_objects_from_lists,
102
107
  ref_lookup_strategy=ref_lookup_strategy, ref_lookup_nocache=ref_lookup_nocache,
103
- norefs=norefs, progress=progress, debug_sleep=debug_sleep)
108
+ norefs=norefs, merge=merge, progress=progress, debug_sleep=debug_sleep)
104
109
 
105
110
  def validate(self, force: bool = False) -> None:
106
111
  def data_without_deleted_properties(data: dict) -> dict:
@@ -346,7 +351,18 @@ class StructuredDataSet:
346
351
 
347
352
  def _load_json_file(self, file: str) -> None:
348
353
  with open(file) as f:
349
- self._add(Schema.type_name(file), json.load(f))
354
+ file_json = json.load(f)
355
+ schema_inferred_from_file_name = Schema.type_name(file)
356
+ if self._portal.get_schema(schema_inferred_from_file_name) is not None:
357
+ # If the JSON file name looks like a schema name then assume it
358
+ # contains an object or an array of object of that schema type.
359
+ self._add(Schema.type_name(file), file_json)
360
+ elif isinstance(file_json, dict):
361
+ # Otherwise if the JSON file name does not look like a schema name then
362
+ # assume it a dictionary where each property is the name of a schema, and
363
+ # which (each property) contains a list of object of that schema type.
364
+ for schema_name in file_json:
365
+ self._add(schema_name, file_json[schema_name])
350
366
 
351
367
  def _load_reader(self, reader: RowReader, type_name: str) -> None:
352
368
  schema = None
@@ -368,7 +384,16 @@ class StructuredDataSet:
368
384
  structured_row_template.set_value(structured_row, column_name, value, reader.file, reader.row_number)
369
385
  if self._autoadd_properties:
370
386
  self._add_properties(structured_row, self._autoadd_properties, schema)
371
- self._add(type_name, structured_row)
387
+ # New merge functionality (2024-05-25).
388
+ if self._merge:
389
+ for identifying_path in self.get_identifying_paths(self._portal, structured_row, type_name):
390
+ if existing_portal_object := self._portal.get_metadata(identifying_path):
391
+ structured_row = merge_objects(existing_portal_object, structured_row)
392
+ if (prune_error := self._prune_structured_row(structured_row)) is not None:
393
+ self._note_error({"src": create_dict(type=schema_name, row=reader.row_number),
394
+ "error": prune_error}, "validation")
395
+ else:
396
+ self._add(type_name, structured_row)
372
397
  if self._progress:
373
398
  self._progress({
374
399
  PROGRESS.LOAD_ITEM: self._nrows,
@@ -385,9 +410,20 @@ class StructuredDataSet:
385
410
  self._note_error(schema._unresolved_refs, "ref")
386
411
  self._resolved_refs.update(schema._resolved_refs)
387
412
 
388
- def _add(self, type_name: str, data: Union[dict, List[dict]]) -> None:
389
- if self._prune:
413
+ def _prune_structured_row(self, data: dict) -> Optional[str]:
414
+ if not self._prune:
415
+ return None
416
+ if not self._remove_empty_objects_from_lists:
390
417
  remove_empty_properties(data)
418
+ return None
419
+ try:
420
+ remove_empty_properties(data, isempty_array_element=lambda element: element == {},
421
+ raise_exception_on_nonempty_array_element_after_empty=True)
422
+ except Exception as e:
423
+ return str(e)
424
+ return None
425
+
426
+ def _add(self, type_name: str, data: Union[dict, List[dict]]) -> None:
391
427
  if type_name in self._data:
392
428
  self._data[type_name].extend([data] if isinstance(data, dict) else data)
393
429
  else:
@@ -1,8 +1,11 @@
1
1
  from contextlib import contextmanager
2
+ from datetime import datetime
2
3
  import os
3
4
  import shutil
4
5
  import tempfile
6
+ from uuid import uuid4 as uuid
5
7
  from typing import List, Optional, Union
8
+ from dcicutils.file_utils import create_random_file
6
9
 
7
10
 
8
11
  @contextmanager
@@ -15,22 +18,59 @@ def temporary_directory() -> str:
15
18
 
16
19
 
17
20
@contextmanager
def temporary_file(name: Optional[str] = None, prefix: Optional[str] = None, suffix: Optional[str] = None,
                   content: Optional[Union[str, bytes, List[str]]] = None) -> str:
    """
    Context manager which creates a file inside a directory obtained from temporary_directory,
    optionally writes the given content to it, and yields the full path of that file.

    The file name is the given prefix, then the given name (or a generated one if not
    specified), then the given suffix. Content given as bytes is written in binary mode;
    content given as a list of strings is written newline-separated; otherwise as-is.
    NOTE(review): cleanup on exit is presumably done by temporary_directory - confirm.
    """
    with temporary_directory() as tmp_directory_name:
        base_name = name or tempfile.mktemp(dir="")
        tmp_file_path = os.path.join(tmp_directory_name, f"{prefix or ''}{base_name}{suffix or ''}")
        open_mode = "wb" if isinstance(content, bytes) else "w"
        with open(tmp_file_path, open_mode) as tmp_file:
            if content is not None:
                if isinstance(content, list):
                    tmp_file.write("\n".join(content))
                else:
                    tmp_file.write(content)
        yield tmp_file_path
30
+
31
+
32
def create_temporary_file_name(prefix: Optional[str] = None, suffix: Optional[str] = None) -> str:
    """
    Generates and returns the full path to a (not yet existing) file within the system
    temporary directory. The file itself is NOT created.

    The file name is the given prefix (if any), then a UTC timestamp of the
    form YYYYMMDDhhmmss, then 32 random hex digits, then the given suffix (if any).
    """
    # Imported locally so this block does not depend on a module-level import of timezone.
    from datetime import timezone

    # datetime.utcnow() is deprecated as of Python 3.12; the timezone-aware
    # equivalent produces the identical formatted timestamp.
    timestamp = datetime.now(timezone.utc).strftime("%Y%m%d%H%M%S")
    tmp_file_name = f"{prefix or ''}{timestamp}{uuid().hex}{suffix or ''}"
    return os.path.join(tempfile.gettempdir(), tmp_file_name)
39
+
40
+
41
@contextmanager
def temporary_random_file(prefix: Optional[str] = None, suffix: Optional[str] = None,
                          nbytes: int = 1024, binary: bool = False, line_length: Optional[int] = None) -> str:
    """
    Context manager which creates a file via temporary_file (with the given prefix and suffix),
    fills it by calling create_random_file with the given nbytes, binary, and line_length
    arguments, and yields the full path of that file.
    """
    with temporary_file(prefix=prefix, suffix=suffix) as random_file_path:
        create_random_file(random_file_path, nbytes=nbytes, binary=binary, line_length=line_length)
        yield random_file_path
26
47
 
27
48
 
28
49
def remove_temporary_directory(tmp_directory_name: str) -> None:
    """
    Recursively deletes the given directory, but ONLY if is_temporary_directory accepts it,
    i.e. only if it is (somewhere) within the system temporary directory; otherwise does nothing.
    """
    if not is_temporary_directory(tmp_directory_name):
        # Guard against errant deletion.
        return
    shutil.rmtree(tmp_directory_name)
55
+
56
+
57
def remove_temporary_file(tmp_file_name: str) -> bool:
    """
    Removes the given file; but ONLY if it is (somewhere) within the system temporary directory.

    The containing directory of the given path is resolved (symbolic links and ".." components)
    before it is compared with the resolved system temporary directory, so a path such
    as <tmpdir>/../some/file is not mistaken for a file within the temporary directory.

    :param tmp_file_name: Path of the file to remove.
    :return: True if the file was removed; False if it is not an existing file within
        the system temporary directory, or if any error occurred (best effort, never raises
        for file-system or bad-argument errors).
    """
    try:
        tmpdir = os.path.realpath(tempfile.gettempdir())
        directory, name = os.path.split(tmp_file_name)
        # Resolve only the directory part: if the file itself is a symbolic link we want
        # to judge (and remove) the link, not whatever it points to.
        target = os.path.join(os.path.realpath(directory or os.curdir), name)
        if os.path.commonpath([tmpdir, target]) == tmpdir and os.path.isfile(target):
            os.remove(target)
            return True
        return False
    except (OSError, TypeError, ValueError):
        # OSError: file-system failure; TypeError: non-path argument (e.g. None);
        # ValueError: paths which cannot be compared (e.g. embedded null, different drives).
        return False
69
+
70
+
71
def is_temporary_directory(path: str) -> bool:
    """
    Returns True if the given path is an existing directory which is (somewhere) within,
    or is itself, the system temporary directory; otherwise returns False.

    Both the given path and the system temporary directory are fully resolved (symbolic
    links and ".." components) before being compared, so a path such as <tmpdir>/../other
    is not mistaken for a directory within the temporary directory. This matters because
    this function is the guard used before recursively deleting a directory.

    :param path: Path of the directory to check.
    :return: True or False as described above; False also on any file-system
        or bad-argument error (never raises for those).
    """
    try:
        tmpdir = os.path.realpath(tempfile.gettempdir())
        resolved_path = os.path.realpath(path)
        return os.path.commonpath([resolved_path, tmpdir]) == tmpdir and os.path.isdir(resolved_path)
    except (OSError, TypeError, ValueError):
        # OSError: file-system failure; TypeError: non-path argument (e.g. None);
        # ValueError: paths which cannot be compared (e.g. embedded null, different drives).
        return False
dcicutils/zip_utils.py CHANGED
@@ -2,7 +2,9 @@ from contextlib import contextmanager
2
2
  from dcicutils.tmpfile_utils import temporary_directory, temporary_file
3
3
  import gzip
4
4
  import os
5
+ import shutil
5
6
  import tarfile
7
+ import tempfile
6
8
  from typing import List, Optional
7
9
  import zipfile
8
10
 
@@ -45,3 +47,28 @@ def unpack_gz_file_to_temporary_file(file: str, suffix: Optional[str] = None) ->
45
47
  outputf.write(inputf.read())
46
48
  outputf.close()
47
49
  yield tmp_file_name
50
+
51
+
52
def extract_file_from_zip(zip_file: str, file_to_extract: str,
                          destination_file: str, raise_exception: bool = True) -> bool:
    """
    Extracts from the given zip file, the given file to extract, writing it to the
    given destination file. Returns True if all is well, otherwise False, or if the
    raise_exception argument is True (the default), then raises an exception on error.

    Note that if the file to extract is simply not present in the zip file then False
    is returned, regardless of the raise_exception argument. If the destination file has
    no directory part it is placed in the current directory; the destination directory
    is created if it does not exist.
    """
    try:
        if not (destination_directory := os.path.dirname(destination_file)):
            destination_directory = os.getcwd()
            destination_file = os.path.join(destination_directory, destination_file)
        with tempfile.TemporaryDirectory() as tmp_directory_name:
            with zipfile.ZipFile(zip_file, "r") as zipf:
                if file_to_extract not in zipf.namelist():
                    return False
                # ZipFile.extract sanitizes the member name (e.g. drops ".." components and
                # any leading slash) and returns the path it actually wrote to; use that
                # rather than re-deriving the path from the raw member name.
                extracted_file = zipf.extract(file_to_extract, path=tmp_directory_name)
            os.makedirs(destination_directory, exist_ok=True)
            shutil.move(extracted_file, destination_file)
            return True
    except Exception:
        if raise_exception:
            raise  # Bare raise to keep the original traceback intact.
        return False
@@ -1,12 +1,12 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: dcicutils
3
- Version: 8.8.5
3
+ Version: 8.8.6.1b1
4
4
  Summary: Utility package for interacting with the 4DN Data Portal and other 4DN resources
5
5
  Home-page: https://github.com/4dn-dcic/utils
6
6
  License: MIT
7
7
  Author: 4DN-DCIC Team
8
8
  Author-email: support@4dnucleome.org
9
- Requires-Python: >=3.8,<3.12
9
+ Requires-Python: >=3.8,<3.13
10
10
  Classifier: Development Status :: 4 - Beta
11
11
  Classifier: Intended Audience :: Developers
12
12
  Classifier: Intended Audience :: Science/Research
@@ -24,9 +24,10 @@ Classifier: Programming Language :: Python :: 3.9
24
24
  Classifier: Topic :: Database :: Database Engines/Servers
25
25
  Requires-Dist: PyJWT (>=2.6.0,<3.0.0)
26
26
  Requires-Dist: PyYAML (>=6.0.1,<7.0.0)
27
+ Requires-Dist: appdirs (>=1.4.4,<2.0.0)
27
28
  Requires-Dist: aws-requests-auth (>=0.4.2,<1)
28
- Requires-Dist: boto3 (>=1.28.57,<2.0.0)
29
- Requires-Dist: botocore (>=1.31.57,<2.0.0)
29
+ Requires-Dist: boto3 (>=1.34.93,<2.0.0)
30
+ Requires-Dist: botocore (>=1.34.93,<2.0.0)
30
31
  Requires-Dist: chardet (>=5.2.0,<6.0.0)
31
32
  Requires-Dist: docker (>=4.4.4,<5.0.0)
32
33
  Requires-Dist: elasticsearch (==7.13.4)
@@ -42,6 +43,7 @@ Requires-Dist: pytz (>=2020.4)
42
43
  Requires-Dist: redis (>=4.5.1,<5.0.0)
43
44
  Requires-Dist: requests (>=2.21.0,<3.0.0)
44
45
  Requires-Dist: rfc3986 (>=1.4.0,<2.0.0)
46
+ Requires-Dist: shortuuid (>=1.0.13,<2.0.0)
45
47
  Requires-Dist: structlog (>=19.2.0,<20.0.0)
46
48
  Requires-Dist: toml (>=0.10.1,<1)
47
49
  Requires-Dist: tqdm (>=4.66.2,<5.0.0)
@@ -27,10 +27,11 @@ dcicutils/env_utils_legacy.py,sha256=J81OAtJHN69o1beHO6q1j7_J6TeblSjnAHlS8VA5KSM
27
27
  dcicutils/es_utils.py,sha256=ZksLh5ei7kRUfiFltk8sd2ZSfh15twbstrMzBr8HNw4,7541
28
28
  dcicutils/exceptions.py,sha256=4giQGtpak-omQv7BP6Ckeu91XK5fnDosC8gfdmN_ccA,9931
29
29
  dcicutils/ff_mocks.py,sha256=6RKS4eUiu_Wl8yP_8V0CaV75w4ZdWxdCuL1CVlnMrek,36918
30
- dcicutils/ff_utils.py,sha256=Yf-fET5gdpjrH0gikpOCIJdY2Dv3obzUpR31ur816mU,72972
31
- dcicutils/file_utils.py,sha256=098rXvLeIh8n69EGW7DpOS227ef3BPgwhRAktoU6mhE,2663
30
+ dcicutils/ff_utils.py,sha256=oIhuZPnGtfwj6bWyCc1u23JbMB_6InPp01ZqUOljd8M,73123
31
+ dcicutils/file_utils.py,sha256=zyNdRl1Fu3SrQwjJWaIMvQpi4DRaodNZCX7oTkiPJ-A,10916
32
32
  dcicutils/function_cache_decorator.py,sha256=XMyiEGODVr2WoAQ68vcoX_9_Xb9p8pZXdXl7keU8i2g,10026
33
33
  dcicutils/glacier_utils.py,sha256=Q4CVXsZCbP-SoZIsZ5NMcawDfelOLzbQnIlQn-GdlTo,34149
34
+ dcicutils/http_utils.py,sha256=tNfH5JA-OwbQKEvD5HPJ3lcp2TSIZ4rnl__4d4JO8Gw,1583
34
35
  dcicutils/jh_utils.py,sha256=Gpsxb9XEzggF_-Eq3ukjKvTnuyb9V1SCSUXkXsES4Kg,11502
35
36
  dcicutils/kibana/dashboards.json,sha256=wHMB_mpJ8OaYhRRgvpZuihaB2lmSF64ADt_8hkBWgQg,16225
36
37
  dcicutils/kibana/readme.md,sha256=3KmHF9FH6A6xwYsNxRFLw27q0XzHYnjZOlYUnn3VkQQ,2164
@@ -43,11 +44,11 @@ dcicutils/license_policies/park-lab-gpl-pipeline.jsonc,sha256=vLZkwm3Js-kjV44nug
43
44
  dcicutils/license_policies/park-lab-pipeline.jsonc,sha256=9qlY0ASy3iUMQlr3gorVcXrSfRHnVGbLhkS427UaRy4,283
44
45
  dcicutils/license_utils.py,sha256=d1cq6iwv5Ju-VjdoINi6q7CPNNL7Oz6rcJdLMY38RX0,46978
45
46
  dcicutils/log_utils.py,sha256=7pWMc6vyrorUZQf-V-M3YC6zrPgNhuV_fzm9xqTPph0,10883
46
- dcicutils/misc_utils.py,sha256=YH_TTmv6ABWeMERwVvA2-rIfdS-CoPYLXJru9TvWxgM,104610
47
+ dcicutils/misc_utils.py,sha256=zHwsxxEn24muLBP7mDvMa8I9VdMejwW8HMuCL5xbhhw,107690
47
48
  dcicutils/obfuscation_utils.py,sha256=fo2jOmDRC6xWpYX49u80bVNisqRRoPskFNX3ymFAmjw,5963
48
49
  dcicutils/opensearch_utils.py,sha256=V2exmFYW8Xl2_pGFixF4I2Cc549Opwe4PhFi5twC0M8,1017
49
50
  dcicutils/portal_object_utils.py,sha256=gDXRgPsRvqCFwbC8WatsuflAxNiigOnqr0Hi93k3AgE,15422
50
- dcicutils/portal_utils.py,sha256=DYyE5o15GekDgzpJWas9iS7klAYbjJZUPW0G42McArk,30779
51
+ dcicutils/portal_utils.py,sha256=_uLdB-ulmFqmClA_Dkpxe4gfEfzSMJSu4yDmtpmqXwQ,33402
51
52
  dcicutils/progress_bar.py,sha256=UT7lxb-rVF_gp4yjY2Tg4eun1naaH__hB4_v3O85bcE,19468
52
53
  dcicutils/project_utils.py,sha256=qPdCaFmWUVBJw4rw342iUytwdQC0P-XKpK4mhyIulMM,31250
53
54
  dcicutils/qa_checkers.py,sha256=cdXjeL0jCDFDLT8VR8Px78aS10hwNISOO5G_Zv2TZ6M,20534
@@ -58,22 +59,22 @@ dcicutils/s3_utils.py,sha256=LauLFQGvZLfpBJ81tYMikjLd3SJRz2R_FrL1n4xSlyI,28868
58
59
  dcicutils/schema_utils.py,sha256=IhtozG2jQ7bFyn54iPEdmDrHoCf3ryJXeXvPJRBXNn0,10095
59
60
  dcicutils/scripts/publish_to_pypi.py,sha256=LFzNHIQK2EXFr88YcfctyA_WKEBFc1ElnSjWrCXedPM,13889
60
61
  dcicutils/scripts/run_license_checker.py,sha256=z2keYnRDZsHQbTeo1XORAXSXNJK5axVzL5LjiNqZ7jE,4184
61
- dcicutils/scripts/view_portal_object.py,sha256=Cy-8GwGJS9EX-5RxE8mjsqNlDT0N6OCpkNffPVkTFQc,26262
62
+ dcicutils/scripts/view_portal_object.py,sha256=HZzM44BDcGycO9XTOTZyP-F7PRMZaZrnFfiqiT7Qvqg,29777
62
63
  dcicutils/secrets_utils.py,sha256=8dppXAsiHhJzI6NmOcvJV5ldvKkQZzh3Fl-cb8Wm7MI,19745
63
64
  dcicutils/sheet_utils.py,sha256=VlmzteONW5VF_Q4vo0yA5vesz1ViUah1MZ_yA1rwZ0M,33629
64
65
  dcicutils/snapshot_utils.py,sha256=ymP7PXH6-yEiXAt75w0ldQFciGNqWBClNxC5gfX2FnY,22961
65
66
  dcicutils/ssl_certificate_utils.py,sha256=F0ifz_wnRRN9dfrfsz7aCp4UDLgHEY8LaK7PjnNvrAQ,9707
66
- dcicutils/structured_data.py,sha256=BQuIMv6OPySsn6YxtXE2Er-zLE2QJuCYhEQ3V0u_UXY,61238
67
+ dcicutils/structured_data.py,sha256=z0QMgbFafJWoOUMwJJDVufgeT7r7fTTasx1ry5axMVM,63546
67
68
  dcicutils/submitr/progress_constants.py,sha256=5bxyX77ql8qEJearfHEvsvXl7D0GuUODW0T65mbRmnE,2895
68
69
  dcicutils/submitr/ref_lookup_strategy.py,sha256=Js2cVznTmgjciLWBPLCvMiwLIHXjDn3jww-gJPjYuFw,3467
69
70
  dcicutils/task_utils.py,sha256=MF8ujmTD6-O2AC2gRGPHyGdUrVKgtr8epT5XU8WtNjk,8082
70
- dcicutils/tmpfile_utils.py,sha256=n95XF8dZVbQRSXBZTGToXXfSs3JUVRyN6c3ZZ0nhAWI,1403
71
+ dcicutils/tmpfile_utils.py,sha256=irmN6Otvtxyum-7qr5h9GIzDs9rtFFyUsGQyqJXd_y4,2997
71
72
  dcicutils/trace_utils.py,sha256=g8kwV4ebEy5kXW6oOrEAUsurBcCROvwtZqz9fczsGRE,1769
72
73
  dcicutils/validation_utils.py,sha256=cMZIU2cY98FYtzK52z5WUYck7urH6JcqOuz9jkXpqzg,14797
73
74
  dcicutils/variant_utils.py,sha256=2H9azNx3xAj-MySg-uZ2SFqbWs4kZvf61JnK6b-h4Qw,4343
74
- dcicutils/zip_utils.py,sha256=rnjNv_k6L9jT2SjDSgVXp4BEJYLtz9XN6Cl2Fy-tqnM,2027
75
- dcicutils-8.8.5.dist-info/LICENSE.txt,sha256=qnwSmfnEWMl5l78VPDEzAmEbLVrRqQvfUQiHT0ehrOo,1102
76
- dcicutils-8.8.5.dist-info/METADATA,sha256=UqVJjm2EYmUXtqMXxqTf1QLhabJL4P3QFe1tZzUW-rg,3352
77
- dcicutils-8.8.5.dist-info/WHEEL,sha256=7Z8_27uaHI_UZAc4Uox4PpBhQ9Y5_modZXWMxtUi4NU,88
78
- dcicutils-8.8.5.dist-info/entry_points.txt,sha256=51Q4F_2V10L0282W7HFjP4jdzW4K8lnWDARJQVFy_hw,270
79
- dcicutils-8.8.5.dist-info/RECORD,,
75
+ dcicutils/zip_utils.py,sha256=_Y9EmL3D2dUZhxucxHvrtmmlbZmK4FpSsHEb7rGSJLU,3265
76
+ dcicutils-8.8.6.1b1.dist-info/LICENSE.txt,sha256=qnwSmfnEWMl5l78VPDEzAmEbLVrRqQvfUQiHT0ehrOo,1102
77
+ dcicutils-8.8.6.1b1.dist-info/METADATA,sha256=5iidFphml1M_LwEmfPJdZnLcaSqT2FflV9Ld2JmeCWk,3439
78
+ dcicutils-8.8.6.1b1.dist-info/WHEEL,sha256=7Z8_27uaHI_UZAc4Uox4PpBhQ9Y5_modZXWMxtUi4NU,88
79
+ dcicutils-8.8.6.1b1.dist-info/entry_points.txt,sha256=51Q4F_2V10L0282W7HFjP4jdzW4K8lnWDARJQVFy_hw,270
80
+ dcicutils-8.8.6.1b1.dist-info/RECORD,,