dcicutils 8.13.3.1b25__py3-none-any.whl → 8.13.3.1b27__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- dcicutils/misc_utils.py +86 -59
- dcicutils/structured_data.py +7 -7
- {dcicutils-8.13.3.1b25.dist-info → dcicutils-8.13.3.1b27.dist-info}/METADATA +1 -1
- {dcicutils-8.13.3.1b25.dist-info → dcicutils-8.13.3.1b27.dist-info}/RECORD +7 -7
- {dcicutils-8.13.3.1b25.dist-info → dcicutils-8.13.3.1b27.dist-info}/LICENSE.txt +0 -0
- {dcicutils-8.13.3.1b25.dist-info → dcicutils-8.13.3.1b27.dist-info}/WHEEL +0 -0
- {dcicutils-8.13.3.1b25.dist-info → dcicutils-8.13.3.1b27.dist-info}/entry_points.txt +0 -0
dcicutils/misc_utils.py
CHANGED
@@ -986,57 +986,73 @@ def str_to_bool(x: Optional[str]) -> Optional[bool]:
|
|
986
986
|
raise ValueError(f"An argument to str_or_bool must be a string or None: {x!r}")
|
987
987
|
|
988
988
|
|
989
|
-
def to_integer(value: str,
|
990
|
-
|
991
|
-
|
992
|
-
|
993
|
-
|
994
|
-
|
995
|
-
|
996
|
-
|
997
|
-
|
998
|
-
|
999
|
-
|
1000
|
-
|
1001
|
-
|
1002
|
-
|
1003
|
-
|
1004
|
-
|
1005
|
-
|
1006
|
-
|
1007
|
-
|
1008
|
-
|
1009
|
-
|
1010
|
-
|
1011
|
-
|
1012
|
-
|
1013
|
-
"
|
1014
|
-
"
|
989
|
+
def to_integer(value: str,
|
990
|
+
allow_commas: bool = False,
|
991
|
+
allow_multiplier_suffix: bool = False,
|
992
|
+
fallback: Optional[Union[int, float]] = None) -> Optional[int]:
|
993
|
+
return to_number(value, fallback=fallback, as_float=False,
|
994
|
+
allow_commas=allow_commas,
|
995
|
+
allow_multiplier_suffix=allow_multiplier_suffix)
|
996
|
+
|
997
|
+
|
998
|
+
def to_float(value: str,
|
999
|
+
allow_commas: bool = False,
|
1000
|
+
allow_multiplier_suffix: bool = False,
|
1001
|
+
fallback: Optional[Union[int, float]] = None) -> Optional[int]:
|
1002
|
+
return to_number(value, fallback=fallback, as_float=True,
|
1003
|
+
allow_commas=allow_commas,
|
1004
|
+
allow_multiplier_suffix=allow_multiplier_suffix)
|
1005
|
+
|
1006
|
+
|
1007
|
+
_TO_NUMBER_MULTIPLIER_K = 1000
|
1008
|
+
_TO_NUMBER_MULTIPLIER_M = 1000 * _TO_NUMBER_MULTIPLIER_K
|
1009
|
+
_TO_NUMBER_MULTIPLIER_G = 1000 * _TO_NUMBER_MULTIPLIER_M
|
1010
|
+
_TO_NUMBER_MULTIPLIER_T = 1000 * _TO_NUMBER_MULTIPLIER_G
|
1011
|
+
|
1012
|
+
_TO_NUMBER_MULTIPLIER_SUFFIXES = {
|
1013
|
+
"K": _TO_NUMBER_MULTIPLIER_K,
|
1014
|
+
"KB": _TO_NUMBER_MULTIPLIER_K,
|
1015
|
+
"M": _TO_NUMBER_MULTIPLIER_M,
|
1016
|
+
"MB": _TO_NUMBER_MULTIPLIER_M,
|
1017
|
+
"G": _TO_NUMBER_MULTIPLIER_G,
|
1018
|
+
"GB": _TO_NUMBER_MULTIPLIER_G,
|
1019
|
+
"T": _TO_NUMBER_MULTIPLIER_T,
|
1020
|
+
"TB": _TO_NUMBER_MULTIPLIER_T
|
1015
1021
|
}
|
1016
1022
|
|
1017
1023
|
|
1018
1024
|
def to_number(value: str,
|
1025
|
+
as_float: bool = False,
|
1019
1026
|
allow_commas: bool = False,
|
1020
1027
|
allow_multiplier_suffix: bool = False,
|
1021
|
-
allow_float: bool = False,
|
1022
1028
|
fallback: Optional[Union[int, float]] = None) -> Optional[Union[int, float]]:
|
1023
|
-
|
1024
1029
|
"""
|
1025
|
-
Converts the
|
1026
|
-
|
1027
|
-
|
1028
|
-
|
1029
|
-
|
1030
|
-
|
1031
|
-
|
1032
|
-
|
1030
|
+
Converts the given string value to an int, or float if as_float is True,
|
1031
|
+
or None or the give fallback value if malformed.
|
1032
|
+
|
1033
|
+
If allow_commas is True then allows appropriately placed commas (i.e. every three digits).
|
1034
|
+
|
1035
|
+
If allow_multiplier_suffix is True allows any of the multiplier suffixes K, KB; M, MB;
|
1036
|
+
or G, GB; or T, TB; all case-insensitive; which will multiply the value by a thousand;
|
1037
|
+
a million; a billion; or a trillion; respectively.
|
1038
|
+
|
1039
|
+
If as_float is True then value is parsed and returned as a float rather than int.
|
1040
|
+
|
1041
|
+
Note that even if as_float is False, values that might LOOK like a float, can be
|
1042
|
+
an int, for example, "1.5K", returns 1500 as an int since it is; but "1.5002K"
|
1043
|
+
is malformed, since 1.5002K is equivalent to 1500.2 which is not an int.
|
1033
1044
|
"""
|
1045
|
+
|
1034
1046
|
if not (isinstance(value, str) and (value := value.strip())):
|
1035
|
-
|
1047
|
+
# Just in case the value is already the actual/desired return type.
|
1048
|
+
if as_float is True:
|
1049
|
+
return float(value) if isinstance(value, (float, int)) else fallback
|
1050
|
+
else:
|
1051
|
+
return value if isinstance(value, int) else fallback
|
1036
1052
|
|
1037
1053
|
value_multiplier = 1
|
1038
|
-
value_negative = False
|
1039
1054
|
value_fraction = None
|
1055
|
+
value_negative = False
|
1040
1056
|
|
1041
1057
|
if value.startswith("-"):
|
1042
1058
|
if not (value := value[1:].strip()):
|
@@ -1048,23 +1064,31 @@ def to_number(value: str,
|
|
1048
1064
|
|
1049
1065
|
if allow_multiplier_suffix is True:
|
1050
1066
|
value_upper = value.upper()
|
1051
|
-
for suffix in
|
1067
|
+
for suffix in _TO_NUMBER_MULTIPLIER_SUFFIXES:
|
1052
1068
|
if value_upper.endswith(suffix):
|
1053
|
-
value_multiplier *=
|
1069
|
+
value_multiplier *= _TO_NUMBER_MULTIPLIER_SUFFIXES[suffix]
|
1054
1070
|
if not (value := value[:-len(suffix)].strip()):
|
1055
1071
|
return fallback
|
1056
1072
|
break
|
1057
1073
|
|
1058
|
-
if
|
1074
|
+
if (allow_multiplier_suffix is True) or (as_float is True):
|
1075
|
+
# Allow for example "1.5K" to mean 1500 (integer).
|
1059
1076
|
if (dot_index := value.rfind(".")) >= 0:
|
1060
1077
|
if value_fraction := value[dot_index + 1:].strip():
|
1061
1078
|
try:
|
1062
1079
|
value_fraction = float(f"0.{value_fraction}")
|
1063
1080
|
except Exception:
|
1064
1081
|
return fallback
|
1065
|
-
value
|
1082
|
+
if not (value := value[:dot_index].strip()):
|
1083
|
+
if not value_fraction:
|
1084
|
+
return fallback
|
1085
|
+
value = "0"
|
1086
|
+
elif (as_float is not True) and (value_dot_zero_suffix := re.search(r"\.0*$", value)):
|
1087
|
+
# Allow for example "123.00" to mean 123 (integer).
|
1088
|
+
value = value[:value_dot_zero_suffix.start()]
|
1066
1089
|
|
1067
1090
|
if (allow_commas is True) and ("," in value):
|
1091
|
+
# Make sure that any commas are properly placed.
|
1068
1092
|
if not re.fullmatch(r"(-?\d{1,3}(,\d{3})*)", value):
|
1069
1093
|
return fallback
|
1070
1094
|
value = value.replace(",", "")
|
@@ -1072,28 +1096,31 @@ def to_number(value: str,
|
|
1072
1096
|
if not value.isdigit():
|
1073
1097
|
return fallback
|
1074
1098
|
|
1075
|
-
|
1099
|
+
value = float(value) if as_float is True else int(value)
|
1076
1100
|
|
1077
1101
|
if value_fraction:
|
1078
|
-
|
1079
|
-
|
1080
|
-
|
1102
|
+
value_float = float(value) + value_fraction
|
1103
|
+
# Here we do NOT simply do: value_float *= float(value_multiplier);
|
1104
|
+
# because it introduces obvious FLOATing point precision ERRORs; for example,
|
1105
|
+
# to_integer("1.5678K", allow_multiplier_suffix=True) would yield 1567.8000000000002
|
1106
|
+
# if we simply did 1.5678 * 1000.0; but doing the multiplication 10 at a time obviates this
|
1107
|
+
# idiosyncracy yielding 1567.8; this ASSUMES that the multipliers are simple multiples of 10.
|
1108
|
+
while value_multiplier > 1:
|
1109
|
+
value_float *= 10
|
1110
|
+
value_multiplier /= 10
|
1111
|
+
if as_float is True:
|
1112
|
+
value = value_float
|
1113
|
+
else:
|
1114
|
+
value = int(value_float)
|
1115
|
+
if value_float != value:
|
1116
|
+
return fallback
|
1117
|
+
else:
|
1118
|
+
value *= value_multiplier
|
1081
1119
|
|
1082
1120
|
if value_negative:
|
1083
|
-
|
1084
|
-
|
1085
|
-
if allow_float is True:
|
1086
|
-
if result == int(result):
|
1087
|
-
result = int(result)
|
1121
|
+
value = -value
|
1088
1122
|
|
1089
|
-
return
|
1090
|
-
|
1091
|
-
|
1092
|
-
def to_float(value: str, fallback: Optional[Any] = None) -> Optional[Any]:
|
1093
|
-
try:
|
1094
|
-
return float(value)
|
1095
|
-
except Exception:
|
1096
|
-
return fallback
|
1123
|
+
return value
|
1097
1124
|
|
1098
1125
|
|
1099
1126
|
def to_boolean(value: str, fallback: Optional[Any]) -> Optional[Any]:
|
dcicutils/structured_data.py
CHANGED
@@ -13,7 +13,7 @@ from dcicutils.data_readers import CsvReader, Excel, RowReader
|
|
13
13
|
from dcicutils.datetime_utils import normalize_date_string, normalize_datetime_string
|
14
14
|
from dcicutils.misc_utils import (create_dict, create_readonly_object, is_uuid, load_json_if,
|
15
15
|
merge_objects, remove_empty_properties, right_trim, split_string,
|
16
|
-
to_boolean, to_enum,
|
16
|
+
to_boolean, to_enum, to_float, to_integer, VirtualApp)
|
17
17
|
from dcicutils.portal_object_utils import PortalObject
|
18
18
|
from dcicutils.portal_utils import Portal as PortalBase
|
19
19
|
from dcicutils.submitr.progress_constants import PROGRESS_PARSE as PROGRESS
|
@@ -727,9 +727,9 @@ class Schema(SchemaBase):
|
|
727
727
|
allow_multiplier_suffix = typeinfo.get("allow_multiplier_suffix") is True
|
728
728
|
def map_integer(value: str, src: Optional[str]) -> Any: # noqa
|
729
729
|
nonlocal allow_commas, allow_multiplier_suffix
|
730
|
-
return
|
731
|
-
|
732
|
-
|
730
|
+
return to_integer(value, fallback=value,
|
731
|
+
allow_commas=allow_commas,
|
732
|
+
allow_multiplier_suffix=allow_multiplier_suffix)
|
733
733
|
return map_integer
|
734
734
|
|
735
735
|
def _map_function_number(self, typeinfo: dict) -> Callable:
|
@@ -737,9 +737,9 @@ class Schema(SchemaBase):
|
|
737
737
|
allow_multiplier_suffix = typeinfo.get("allow_multiplier_suffix") is True
|
738
738
|
def map_number(value: str, src: Optional[str]) -> Any: # noqa
|
739
739
|
nonlocal allow_commas, allow_multiplier_suffix
|
740
|
-
return
|
741
|
-
|
742
|
-
|
740
|
+
return to_float(value, fallback=value,
|
741
|
+
allow_commas=allow_commas,
|
742
|
+
allow_multiplier_suffix=allow_multiplier_suffix)
|
743
743
|
return map_number
|
744
744
|
|
745
745
|
def _map_function_string(self, typeinfo: dict) -> Callable:
|
@@ -45,7 +45,7 @@ dcicutils/license_policies/park-lab-gpl-pipeline.jsonc,sha256=vLZkwm3Js-kjV44nug
|
|
45
45
|
dcicutils/license_policies/park-lab-pipeline.jsonc,sha256=9qlY0ASy3iUMQlr3gorVcXrSfRHnVGbLhkS427UaRy4,283
|
46
46
|
dcicutils/license_utils.py,sha256=2Yxnh1T1iuMe6wluwbvpFO_zYSGPxB4-STAMc-vz-YM,47202
|
47
47
|
dcicutils/log_utils.py,sha256=7pWMc6vyrorUZQf-V-M3YC6zrPgNhuV_fzm9xqTPph0,10883
|
48
|
-
dcicutils/misc_utils.py,sha256=
|
48
|
+
dcicutils/misc_utils.py,sha256=R3nUtmx4nynmdTfc98w3CV2JKYCPZPRBijets1nWM20,114877
|
49
49
|
dcicutils/obfuscation_utils.py,sha256=fo2jOmDRC6xWpYX49u80bVNisqRRoPskFNX3ymFAmjw,5963
|
50
50
|
dcicutils/opensearch_utils.py,sha256=V2exmFYW8Xl2_pGFixF4I2Cc549Opwe4PhFi5twC0M8,1017
|
51
51
|
dcicutils/portal_object_utils.py,sha256=Az3n1aL-PQkN5gOFE6ZqC2XkYsqiwKlq7-tZggs1QN4,11062
|
@@ -66,7 +66,7 @@ dcicutils/secrets_utils.py,sha256=8dppXAsiHhJzI6NmOcvJV5ldvKkQZzh3Fl-cb8Wm7MI,19
|
|
66
66
|
dcicutils/sheet_utils.py,sha256=VlmzteONW5VF_Q4vo0yA5vesz1ViUah1MZ_yA1rwZ0M,33629
|
67
67
|
dcicutils/snapshot_utils.py,sha256=YDeI3vD-MhAtHwKDzfEm2q-n3l-da2yRpRR3xp0Ah1M,23021
|
68
68
|
dcicutils/ssl_certificate_utils.py,sha256=F0ifz_wnRRN9dfrfsz7aCp4UDLgHEY8LaK7PjnNvrAQ,9707
|
69
|
-
dcicutils/structured_data.py,sha256=
|
69
|
+
dcicutils/structured_data.py,sha256=LN-Bn-RUM_jy0T6s-ovZT9QXDsQ8w1_QVtkb8LAHFs4,66119
|
70
70
|
dcicutils/submitr/progress_constants.py,sha256=5bxyX77ql8qEJearfHEvsvXl7D0GuUODW0T65mbRmnE,2895
|
71
71
|
dcicutils/submitr/ref_lookup_strategy.py,sha256=VJN-Oo0LLna6Vo2cu47eC-eU-yUC9NFlQP29xajejVU,4741
|
72
72
|
dcicutils/task_utils.py,sha256=MF8ujmTD6-O2AC2gRGPHyGdUrVKgtr8epT5XU8WtNjk,8082
|
@@ -75,8 +75,8 @@ dcicutils/trace_utils.py,sha256=g8kwV4ebEy5kXW6oOrEAUsurBcCROvwtZqz9fczsGRE,1769
|
|
75
75
|
dcicutils/validation_utils.py,sha256=cMZIU2cY98FYtzK52z5WUYck7urH6JcqOuz9jkXpqzg,14797
|
76
76
|
dcicutils/variant_utils.py,sha256=2H9azNx3xAj-MySg-uZ2SFqbWs4kZvf61JnK6b-h4Qw,4343
|
77
77
|
dcicutils/zip_utils.py,sha256=_Y9EmL3D2dUZhxucxHvrtmmlbZmK4FpSsHEb7rGSJLU,3265
|
78
|
-
dcicutils-8.13.3.
|
79
|
-
dcicutils-8.13.3.
|
80
|
-
dcicutils-8.13.3.
|
81
|
-
dcicutils-8.13.3.
|
82
|
-
dcicutils-8.13.3.
|
78
|
+
dcicutils-8.13.3.1b27.dist-info/LICENSE.txt,sha256=qnwSmfnEWMl5l78VPDEzAmEbLVrRqQvfUQiHT0ehrOo,1102
|
79
|
+
dcicutils-8.13.3.1b27.dist-info/METADATA,sha256=w4K_ZFbf-pBM62p35V5NoZS4HQWx0jlimtBQ2z73pQE,3440
|
80
|
+
dcicutils-8.13.3.1b27.dist-info/WHEEL,sha256=7Z8_27uaHI_UZAc4Uox4PpBhQ9Y5_modZXWMxtUi4NU,88
|
81
|
+
dcicutils-8.13.3.1b27.dist-info/entry_points.txt,sha256=W6kEWdUJk9tQ4myAgpehPdebcwvCAZ7UgB-wyPgDUMg,335
|
82
|
+
dcicutils-8.13.3.1b27.dist-info/RECORD,,
|
File without changes
|
File without changes
|
File without changes
|