hestia-earth-utils 0.15.13__tar.gz → 0.15.15__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (44) hide show
  1. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/PKG-INFO +1 -1
  2. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/utils/emission.py +10 -2
  3. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/utils/lookup_utils.py +63 -49
  4. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/utils/pivot/_shared.py +16 -0
  5. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/utils/pivot/pivot_csv.py +2 -2
  6. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/utils/pivot/pivot_json.py +10 -10
  7. hestia_earth_utils-0.15.15/hestia_earth/utils/version.py +1 -0
  8. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth_utils.egg-info/PKG-INFO +1 -1
  9. hestia_earth_utils-0.15.13/hestia_earth/utils/version.py +0 -1
  10. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/MANIFEST.in +0 -0
  11. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/README.md +0 -0
  12. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/bin/hestia-format-upload +0 -0
  13. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/bin/hestia-pivot-csv +0 -0
  14. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/__init__.py +0 -0
  15. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/utils/__init__.py +0 -0
  16. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/utils/api.py +0 -0
  17. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/utils/blank_node.py +0 -0
  18. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/utils/calculation_status.py +0 -0
  19. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/utils/cycle.py +0 -0
  20. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/utils/date.py +0 -0
  21. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/utils/descriptive_stats.py +0 -0
  22. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/utils/lookup.py +0 -0
  23. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/utils/model.py +0 -0
  24. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/utils/pipeline.py +0 -0
  25. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/utils/pivot/__init__.py +0 -0
  26. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/utils/request.py +0 -0
  27. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/utils/stats.py +0 -0
  28. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/utils/storage/__init__.py +0 -0
  29. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/utils/storage/_azure_client.py +0 -0
  30. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/utils/storage/_local_client.py +0 -0
  31. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/utils/storage/_s3_client.py +0 -0
  32. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/utils/storage/_sns_client.py +0 -0
  33. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/utils/table.py +0 -0
  34. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/utils/term.py +0 -0
  35. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth/utils/tools.py +0 -0
  36. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth_utils.egg-info/SOURCES.txt +0 -0
  37. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth_utils.egg-info/dependency_links.txt +0 -0
  38. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth_utils.egg-info/requires.txt +0 -0
  39. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/hestia_earth_utils.egg-info/top_level.txt +0 -0
  40. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/setup.cfg +0 -0
  41. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/setup.py +0 -0
  42. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/tests/pivot/__init__.py +0 -0
  43. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/tests/pivot/test_pivot_csv.py +0 -0
  44. {hestia_earth_utils-0.15.13 → hestia_earth_utils-0.15.15}/tests/pivot/test_pivot_json.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: hestia_earth_utils
3
- Version: 0.15.13
3
+ Version: 0.15.15
4
4
  Summary: HESTIA's utils library
5
5
  Home-page: https://gitlab.com/hestia-earth/hestia-utils
6
6
  Author: HESTIA Team
@@ -9,7 +9,11 @@ from .lookup_utils import (
9
9
  is_product_termType_allowed,
10
10
  is_product_id_allowed,
11
11
  is_input_termType_allowed,
12
- is_input_id_allowed
12
+ is_input_id_allowed,
13
+ is_practice_termType_allowed,
14
+ is_practice_id_allowed,
15
+ is_transformation_termType_allowed,
16
+ is_transformation_id_allowed,
13
17
  )
14
18
 
15
19
 
@@ -35,7 +39,11 @@ def cycle_emission_is_in_system_boundary(cycle: dict):
35
39
  is_product_termType_allowed,
36
40
  is_product_id_allowed,
37
41
  is_input_termType_allowed,
38
- is_input_id_allowed
42
+ is_input_id_allowed,
43
+ is_practice_termType_allowed,
44
+ is_practice_id_allowed,
45
+ is_transformation_termType_allowed,
46
+ is_transformation_id_allowed,
39
47
  ]))
40
48
 
41
49
  return filter_term
@@ -1,5 +1,6 @@
1
1
  from functools import lru_cache
2
2
  import json
3
+ from hestia_earth.schema import SchemaType
3
4
 
4
5
  from .lookup import _download_lookup_data, download_lookup, get_table_value, column_name
5
6
  from .api import download_hestia
@@ -35,6 +36,10 @@ def _get_site_measurements(node: dict):
35
36
  return flatten([non_empty_list(site.get('measurements', [])) for site in sites])
36
37
 
37
38
 
39
+ def _blank_node_term_values(blank_nodes: list, key: str = '@id'):
40
+ return non_empty_list([v.get('term', {}).get(key) for v in blank_nodes])
41
+
42
+
38
43
  @lru_cache()
39
44
  def _allowed_model_mapping(model: str, term_id: str, column: str):
40
45
  mapping = _allowed_mapping_data()
@@ -45,22 +50,23 @@ def _allowed_model_mapping(model: str, term_id: str, column: str):
45
50
  return (value or _ALLOW_ALL).split(';') if isinstance(value, str) else _ALLOW_ALL
46
51
 
47
52
 
53
+ def _is_model_value_allowed(model: str, term_id: str, values: list, lookup_column: str):
54
+ allowed_values = _allowed_model_mapping(model, term_id, lookup_column)
55
+ return any([
56
+ _ALLOW_ALL in allowed_values,
57
+ len(values) == 0
58
+ ]) or any([value in allowed_values for value in values])
59
+
60
+
48
61
  def is_model_siteType_allowed(model: str, term_id: str, data: dict):
49
- site_types = _get_site_types(data)
50
- allowed_values = _allowed_model_mapping(model, term_id, 'siteTypesAllowed')
51
- return True if _ALLOW_ALL in allowed_values or not site_types else any([
52
- (site_type in allowed_values) for site_type in site_types
53
- ])
62
+ values = _get_site_types(data)
63
+ return _is_model_value_allowed(model, term_id, values, 'siteTypesAllowed')
54
64
 
55
65
 
56
66
  def is_model_product_id_allowed(model: str, term_id: str, data: dict):
57
67
  products = data.get('products', [])
58
- values = non_empty_list([p.get('term', {}).get('@id') for p in products])
59
- allowed_values = _allowed_model_mapping(model, term_id, 'productTermIdsAllowed')
60
- return True if any([
61
- _ALLOW_ALL in allowed_values,
62
- len(values) == 0
63
- ]) else any([value in allowed_values for value in values])
68
+ values = _blank_node_term_values(products)
69
+ return _is_model_value_allowed(model, term_id, values, 'productTermIdsAllowed')
64
70
 
65
71
 
66
72
  @lru_cache()
@@ -73,68 +79,76 @@ def _allowed_mapping(term_id: str, column: str):
73
79
  return (value or _ALLOW_ALL).split(';') if isinstance(value, str) else _ALLOW_ALL
74
80
 
75
81
 
82
+ def _is_term_value_allowed(term_id: str, values: list, lookup_column: str):
83
+ allowed_values = _allowed_mapping(term_id, lookup_column)
84
+ return any([
85
+ _ALLOW_ALL in allowed_values,
86
+ len(values) == 0
87
+ ]) or any([value in allowed_values for value in values])
88
+
89
+
76
90
  def is_siteType_allowed(data: dict, term_id: str):
77
- site_types = _get_site_types(data)
78
- allowed_values = _allowed_mapping(term_id, 'siteTypesAllowed')
79
- return True if _ALLOW_ALL in allowed_values or not site_types else any([
80
- (site_type in allowed_values) for site_type in site_types
81
- ])
91
+ values = _get_site_types(data)
92
+ return _is_term_value_allowed(term_id, values, 'siteTypesAllowed')
82
93
 
83
94
 
84
95
  def is_site_measurement_id_allowed(data: dict, term_id: str):
85
96
  measurements = _get_site_measurements(data)
86
- values = non_empty_list([v.get('term', {}).get('@id') for v in measurements])
87
- allowed_values = _allowed_mapping(term_id, 'siteMeasurementIdsAllowed')
88
- return True if any([
89
- _ALLOW_ALL in allowed_values,
90
- len(values) == 0
91
- ]) else any([value in allowed_values for value in values])
97
+ values = _blank_node_term_values(measurements, key='@id')
98
+ return _is_term_value_allowed(term_id, values, 'siteMeasurementIdsAllowed')
92
99
 
93
100
 
94
101
  def is_product_termType_allowed(data: dict, term_id: str):
95
102
  products = data.get('products', [])
96
- values = non_empty_list([p.get('term', {}).get('termType') for p in products])
97
- allowed_values = _allowed_mapping(term_id, 'productTermTypesAllowed')
98
- return True if any([
99
- _ALLOW_ALL in allowed_values,
100
- len(values) == 0
101
- ]) else any([value in allowed_values for value in values])
103
+ values = _blank_node_term_values(products, key='termType')
104
+ return _is_term_value_allowed(term_id, values, 'productTermTypesAllowed')
102
105
 
103
106
 
104
107
  def is_product_id_allowed(data: dict, term_id: str):
105
108
  products = data.get('products', [])
106
- values = non_empty_list([p.get('term', {}).get('@id') for p in products])
107
- allowed_values = _allowed_mapping(term_id, 'productTermIdsAllowed')
108
- return True if any([
109
- _ALLOW_ALL in allowed_values,
110
- len(values) == 0
111
- ]) else any([value in allowed_values for value in values])
109
+ values = _blank_node_term_values(products, key='@id')
110
+ return _is_term_value_allowed(term_id, values, 'productTermIdsAllowed')
112
111
 
113
112
 
114
113
  def is_input_termType_allowed(data: dict, term_id: str):
115
114
  inputs = data.get('inputs', [])
116
- values = non_empty_list([p.get('term', {}).get('termType') for p in inputs])
117
- allowed_values = _allowed_mapping(term_id, 'inputTermTypesAllowed')
118
- return True if any([
119
- _ALLOW_ALL in allowed_values,
120
- len(values) == 0
121
- ]) else any([value in allowed_values for value in values])
115
+ values = _blank_node_term_values(inputs, key='termType')
116
+ return _is_term_value_allowed(term_id, values, 'inputTermTypesAllowed')
122
117
 
123
118
 
124
119
  def is_input_id_allowed(data: dict, term_id: str):
125
120
  inputs = data.get('inputs', [])
126
- values = non_empty_list([p.get('term', {}).get('@id') for p in inputs])
127
- allowed_values = _allowed_mapping(term_id, 'inputTermIdsAllowed')
128
- return True if any([
129
- _ALLOW_ALL in allowed_values,
130
- len(values) == 0
131
- ]) else any([value in allowed_values for value in values])
121
+ values = _blank_node_term_values(inputs, key='@id')
122
+ return _is_term_value_allowed(term_id, values, 'inputTermIdsAllowed')
123
+
124
+
125
+ def is_practice_termType_allowed(data: dict, term_id: str):
126
+ practices = data.get('practices', [])
127
+ values = _blank_node_term_values(practices, key='termType')
128
+ return _is_term_value_allowed(term_id, values, 'practiceTermTypesAllowed')
129
+
130
+
131
+ def is_practice_id_allowed(data: dict, term_id: str):
132
+ practices = data.get('practices', [])
133
+ values = _blank_node_term_values(practices, key='@id')
134
+ return _is_term_value_allowed(term_id, values, 'practiceTermIdsAllowed')
135
+
136
+
137
+ def is_transformation_termType_allowed(data: dict, term_id: str):
138
+ is_transformation = data.get('@type', data.get('type')) == SchemaType.TRANSFORMATION.value
139
+ values = non_empty_list([data.get('term', {}).get('termType')])
140
+ return not is_transformation or _is_term_value_allowed(term_id, values, 'transformationTermTypesAllowed')
141
+
142
+
143
+ def is_transformation_id_allowed(data: dict, term_id: str):
144
+ is_transformation = data.get('@type', data.get('type')) == SchemaType.TRANSFORMATION.value
145
+ values = non_empty_list([data.get('term', {}).get('@id')])
146
+ return not is_transformation or _is_term_value_allowed(term_id, values, 'transformationTermIdsAllowed')
132
147
 
133
148
 
134
149
  def is_node_type_allowed(data: dict, term_id: str):
135
- node_type = data.get('@type', data.get('type'))
136
- allowed_types = _allowed_mapping(term_id, 'typesAllowed')
137
- return True if _ALLOW_ALL in allowed_types or not node_type else node_type in allowed_types
150
+ values = non_empty_list([data.get('@type', data.get('type'))])
151
+ return _is_term_value_allowed(term_id, values, 'typesAllowed')
138
152
 
139
153
 
140
154
  @lru_cache()
@@ -1,5 +1,6 @@
1
1
  import json
2
2
  import numpy as np
3
+ from hestia_earth.schema import EmissionMethodTier
3
4
 
4
5
 
5
6
  EXCLUDE_FIELDS = ["@type", "type", "@context"]
@@ -33,3 +34,18 @@ def _is_scalar_list(value):
33
34
  all_scalar = False
34
35
  break
35
36
  return all_scalar
37
+
38
+
39
+ def _filter_not_relevant(blank_node: dict):
40
+ return blank_node.get('methodTier') != EmissionMethodTier.NOT_RELEVANT.value
41
+
42
+
43
+ def _filter_emissions_not_relevant(node: dict):
44
+ """
45
+ Ignore all emissions where `methodTier=not relevant` so save space.
46
+ """
47
+ return node | ({
48
+ key: list(filter(_filter_not_relevant, node[key]))
49
+ for key in ['emissions', 'emissionsResourceUse']
50
+ if key in node
51
+ })
@@ -8,7 +8,7 @@ from flatten_json import flatten as flatten_json
8
8
 
9
9
  # __package__ = "hestia_earth.utils" # required to run interactively in vscode
10
10
  from ..api import find_term_ids_by_names
11
- from ._shared import EXCLUDE_FIELDS, EXCLUDE_PRIVATE_FIELDS, _with_csv_formatting
11
+ from ._shared import EXCLUDE_FIELDS, EXCLUDE_PRIVATE_FIELDS, _with_csv_formatting, _filter_emissions_not_relevant
12
12
 
13
13
 
14
14
  PANDAS_IMPORT_ERROR_MSG = "Run `pip install pandas>=1.2` to use this functionality"
@@ -293,7 +293,7 @@ def pivot_nodes(nodes: list[dict]):
293
293
  Pivot array of nodes in dict format (e.g under the 'nodes' key of a .hestia file)
294
294
  The nodes json should first be parsed using _with_csv_formatting for output as csv.
295
295
  """
296
- df_in = nodes_to_df(nodes)
296
+ df_in = nodes_to_df(list(map(_filter_emissions_not_relevant, nodes)))
297
297
 
298
298
  regex = rf".*\.({'|'.join(EXCLUDE_FIELDS + EXCLUDE_PRIVATE_FIELDS)})$"
299
299
  df_in.drop(df_in.filter(regex=regex).columns, axis=1, inplace=True)
@@ -5,7 +5,8 @@ from flatten_json import flatten, unflatten_list
5
5
  from collections import defaultdict
6
6
  from copy import deepcopy
7
7
 
8
- from ._shared import EXCLUDE_FIELDS, EXCLUDE_PRIVATE_FIELDS, _with_csv_formatting
8
+ from hestia_earth.utils.pipeline import _node_type
9
+ from ._shared import EXCLUDE_FIELDS, EXCLUDE_PRIVATE_FIELDS, _with_csv_formatting, _filter_emissions_not_relevant
9
10
 
10
11
  pivot_exclude_fields = Term().fields
11
12
  pivot_exclude_fields.update({k: "" for k in EXCLUDE_FIELDS} | {k: "" for k in EXCLUDE_PRIVATE_FIELDS})
@@ -52,7 +53,7 @@ def _base_pivoted_value(key: str, value, is_top_level: bool):
52
53
 
53
54
  def _do_pivot(node, parent_node_type=None, parent_field=None, level=0): # noqa: C901
54
55
  # print('\ninput node', level, node, '\n')
55
- node_type = node.get("@type", node.get("type"))
56
+ node_type = _node_type(node)
56
57
  if node_type not in ADAPTED_UNIQUENESS_FIELDS:
57
58
  return node
58
59
  pivoted_node = {
@@ -206,6 +207,13 @@ def _do_pivot(node, parent_node_type=None, parent_field=None, level=0): # noqa:
206
207
  return pivoted_node
207
208
 
208
209
 
210
+ def pivot_node(node: dict):
211
+ """
212
+ Pivot single node in dict format parsed with object_hook=_with_csv_formatting
213
+ """
214
+ return _do_pivot(_filter_emissions_not_relevant(node))
215
+
216
+
209
217
  def pivot_json_node(json_node: str):
210
218
  """
211
219
  Pivot single schema-compliant unparsed json string node
@@ -227,11 +235,3 @@ def pivot_nodes(nodes: list[dict]):
227
235
  Pivot multiple nodes in dict format parsed with object_hook=_with_csv_formatting
228
236
  """
229
237
  return [pivot_node(node) for node in nodes]
230
-
231
-
232
- def pivot_node(node: dict):
233
- """
234
- Pivot single node in dict format parsed with object_hook=_with_csv_formatting
235
- """
236
- pivoted_node = _do_pivot(node)
237
- return pivoted_node
@@ -0,0 +1 @@
1
+ VERSION = '0.15.15'
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: hestia-earth-utils
3
- Version: 0.15.13
3
+ Version: 0.15.15
4
4
  Summary: HESTIA's utils library
5
5
  Home-page: https://gitlab.com/hestia-earth/hestia-utils
6
6
  Author: HESTIA Team
@@ -1 +0,0 @@
1
- VERSION = '0.15.13'