PyPI - hestia-earth-models - Versions diffs - 0.74.8__py3-none-any.whl → 0.74.9__py3-none-any.whl - Mend

hestia-earth-models 0.74.8__py3-none-any.whl → 0.74.9__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (48) hide show

hestia_earth/models/cache_sites.py CHANGED Viewed

@@ -3,11 +3,11 @@ from enum import Enum
 from pydash.objects import merge
 from hestia_earth.schema import TermTermType
 from hestia_earth.utils.tools import flatten, non_empty_list
+from hestia_earth.utils.term import download_term
 from .log import logger
 from .utils import CACHE_KEY, cached_value
 from .utils.site import CACHE_YEARS_KEY
-from .utils.term import download_term
 from .site.pre_checks.cache_geospatialDatabase import (
     list_vectors, list_rasters, cache_site_results, _should_run
 )

hestia_earth/models/faostat2018/liveweightPerHead.py CHANGED Viewed

@@ -2,10 +2,10 @@ from hestia_earth.schema import TermTermType
 from hestia_earth.utils.lookup import extract_grouped_data_closest_date
 from hestia_earth.utils.model import filter_list_term_type
 from hestia_earth.utils.tools import non_empty_list, safe_parse_date, safe_parse_float
+from hestia_earth.utils.term import download_term
 from hestia_earth.models.log import logRequirements, logShouldRun
 from hestia_earth.models.utils.constant import Units
-from hestia_earth.models.utils.term import download_term
 from hestia_earth.models.utils.property import _new_property, node_has_no_property
 from hestia_earth.models.utils.product import convert_product_to_unit
 from hestia_earth.models.utils.animalProduct import FAO_LOOKUP_COLUMN, get_animalProduct_lookup_value

hestia_earth/models/faostat2018/product/price.py CHANGED Viewed

@@ -1,10 +1,10 @@
 from hestia_earth.schema import TermTermType
 from hestia_earth.utils.lookup import extract_grouped_data
 from hestia_earth.utils.tools import non_empty_list, safe_parse_float, safe_parse_date
+from hestia_earth.utils.term import download_term
 from hestia_earth.models.log import debugValues, logRequirements, logShouldRun
 from hestia_earth.models.utils.constant import Units
-from hestia_earth.models.utils.term import download_term
 from hestia_earth.models.utils.currency import DEFAULT_CURRENCY
 from hestia_earth.models.utils.crop import FAOSTAT_PRODUCTION_LOOKUP_COLUMN, get_crop_grouping_faostat_production
 from hestia_earth.models.utils.animalProduct import FAO_LOOKUP_COLUMN, get_animalProduct_grouping_fao

hestia_earth/models/geospatialDatabase/ecoClimateZone.py CHANGED Viewed

@@ -77,4 +77,4 @@ def _should_run(site: dict):
     return should_run
-def run(site: dict): return _run(site) if _should_run(site) else _run_default(site)
+def run(site: dict): return (_run(site) if _should_run(site) else []) or _run_default(site)

hestia_earth/models/geospatialDatabase/region.py CHANGED Viewed

@@ -1,9 +1,9 @@
 from hestia_earth.schema import TermTermType
 from hestia_earth.utils.model import linked_node
+from hestia_earth.utils.term import download_term
 from hestia_earth.models.log import debugValues, logRequirements, logShouldRun
 from .utils import download, has_coordinates
-from hestia_earth.models.utils.term import download_term
 from . import MODEL
 REQUIREMENTS = {

hestia_earth/models/geospatialDatabase/utils.py CHANGED Viewed

@@ -4,10 +4,10 @@ from area import area
 from functools import reduce, lru_cache
 from hestia_earth.schema import TermTermType
 from hestia_earth.utils.tools import non_empty_list
+from hestia_earth.utils.term import download_term
 from hestia_earth.models.log import debugValues, logErrorRun, logRequirements
 from hestia_earth.models.utils.site import cached_value, region_factor, region_level_1_id
-from hestia_earth.models.utils.term import download_term
 from . import MODEL
 MAX_AREA_SIZE = int(os.getenv('MAX_AREA_SIZE', '5000'))

hestia_earth/models/globalCropWaterModel2008/rootingDepth.py CHANGED Viewed

@@ -1,10 +1,11 @@
 from hestia_earth.schema import CycleFunctionalUnit, TermTermType
 from hestia_earth.utils.model import find_term_match, filter_list_term_type
 from hestia_earth.utils.tools import list_sum, non_empty_list, safe_parse_float
+from hestia_earth.utils.term import download_term
 from hestia_earth.models.log import logRequirements, logShouldRun
 from hestia_earth.models.utils.property import _new_property, node_has_no_property
-from hestia_earth.models.utils.term import get_irrigation_terms, download_term
+from hestia_earth.models.utils.term import get_irrigation_terms
 from hestia_earth.models.utils.crop import get_crop_lookup_value
 from hestia_earth.models.utils.completeness import _is_term_type_complete
 from . import MODEL

hestia_earth/models/haversineFormula/transport/distance.py CHANGED Viewed

@@ -1,10 +1,10 @@
 from haversine import haversine
 from hestia_earth.schema import TermTermType
 from hestia_earth.utils.tools import non_empty_list
+from hestia_earth.utils.term import download_term
 from hestia_earth.models.log import logRequirements, logShouldRun, debugValues
 from hestia_earth.models.utils.method import include_methodModel
-from hestia_earth.models.utils.term import download_term
 from .. import MODEL
 REQUIREMENTS = {

hestia_earth/models/hestia/aboveGroundCropResidue.py CHANGED Viewed

@@ -112,12 +112,10 @@ def _run(cycle: dict, total_values: list):
         if value == 0:
             values.extend([_product(term_id, value)])
-        elif remaining_value > 0 and value is not None and value >= 0:
+        elif remaining_value >= 0 and value is not None and value >= 0:
             value = value if value < remaining_value else remaining_value
             values.extend([_product(term_id, value)])
             remaining_value = remaining_value - value
-            if remaining_value == 0:
-                break
     return values + [
         # whatever remains is "left on field"

hestia_earth/models/hestia/cropResidueManagement.py CHANGED Viewed

@@ -21,6 +21,7 @@ RETURNS = {
     }]
 }
 MODEL_KEY = 'cropResidueManagement'
+TERM_ID = 'residueBurnt,residueIncorporated,residueLeftOnField,residueRemoved,residueIncorporatedLessThan30DaysBeforeCultivation,residueIncorporatedMoreThan30DaysBeforeCultivation'  # noqa: E501
 PRACTICE_IDS = [
     residueBurnt.TERM_ID,
     residueIncorporated.TERM_ID,

hestia_earth/models/hestia/excretaKgMass.py CHANGED Viewed

@@ -1,10 +1,10 @@
 from hestia_earth.schema import NodeType, TermTermType
 from hestia_earth.utils.model import filter_list_term_type, find_term_match
 from hestia_earth.utils.tools import non_empty_list, list_sum
+from hestia_earth.utils.term import download_term
 from hestia_earth.models.log import debugValues, logRequirements, logShouldRun
 from hestia_earth.models.utils import get_kg_term_id, get_kg_N_term_id, get_kg_VS_term_id, _filter_list_term_unit
-from hestia_earth.models.utils.term import download_term
 from hestia_earth.models.utils.constant import Units
 from hestia_earth.models.utils.product import _new_product, convert_product_to_unit
 from . import MODEL

hestia_earth/models/hestia/landCover.py CHANGED Viewed

@@ -10,7 +10,7 @@ from hestia_earth.utils.model import filter_list_term_type
 from hestia_earth.utils.tools import safe_parse_float, to_precision
 from hestia_earth.models.log import logRequirements, log_as_table, logShouldRun
-from hestia_earth.models.utils import _omit
+from hestia_earth.models.utils import _omit, clamp
 from hestia_earth.models.utils.constant import DAYS_IN_YEAR
 from hestia_earth.models.utils.management import _new_management
 from hestia_earth.models.utils.term import get_lookup_value
@@ -896,11 +896,15 @@ def _should_run_historical_land_use_change_single_crop(
         land_use_type=land_use_type,
         permanent_crops_net_expansion=permanent_crops_net_expansion
     )
+    capped_expansion_factor = clamp(
+        value=expansion_factor * e9_net_expansion * net_expansion_cultivated_vs_harvested,
+        min_value=0,
+        max_value=1
+    )
     site_area = {
-        land_type: (
-           shares_of_expansion[land_type] * expansion_factor * e9_net_expansion * net_expansion_cultivated_vs_harvested
-        ) for land_type in LAND_USE_TERMS_FOR_TRANSFORMATION.keys()
+        land_type: (shares_of_expansion[land_type] * capped_expansion_factor)
+        for land_type in LAND_USE_TERMS_FOR_TRANSFORMATION.keys()
         if land_type != land_use_type
     }
     site_area[land_use_type] = 1 - sum(site_area.values())
@@ -941,6 +945,9 @@ def _get_land_use_term_from_node(node: dict):
     return _get_lookup_with_cache(lookup_term=node.get("term", {}), column=LOOKUPS.get("landCover")[1])
+def _date_strip(date: str): return date[:10] if date else None
 def _collect_land_use_types(nodes: list) -> list:
     """Look up the land use type from management nodes."""
     return [
@@ -949,8 +956,8 @@ def _collect_land_use_types(nodes: list) -> list:
             "term": node.get("term", {}),
             "id": node.get("term", {}).get("@id"),
             "land-use-type": _get_land_use_term_from_node(node),
-            "endDate": _gapfill_datestr(datestr=node.get("endDate"), mode=DatestrGapfillMode.END)[:10],
-            "startDate": _gapfill_datestr(datestr=node.get("startDate"), mode=DatestrGapfillMode.START)[:10]
+            "endDate": _date_strip(_gapfill_datestr(datestr=node.get("endDate"), mode=DatestrGapfillMode.END)),
+            "startDate": _date_strip(_gapfill_datestr(datestr=node.get("startDate"), mode=DatestrGapfillMode.START))
         } for node in nodes
     ]

hestia_earth/models/hestia/landOccupationDuringCycle.py CHANGED Viewed

@@ -212,7 +212,7 @@ def _format_inventory(inventory: list[SiteData], default: str = "None") -> str:
 def _should_run(impact_assessment: dict):
-    cycle = impact_assessment.get("cycle")
+    cycle = impact_assessment.get("cycle", {})
     functional_unit = cycle.get("functionalUnit")
     product = get_product(impact_assessment)

hestia_earth/models/hestia/management.py CHANGED Viewed

@@ -286,7 +286,7 @@ def _dates_overlap(target_practice: dict, node: dict, cycle: dict, site_type_id:
     ])
-def _should_run_practice(management_nodes: list, cycle: dict, site_type_id: str):
+def _should_run_practice(site: dict, management_nodes: list, cycle: dict, site_type_id: str):
     """
     Include only landUseManagement practices where GAP_FILL_TO_MANAGEMENT = True
     """
@@ -297,21 +297,34 @@ def _should_run_practice(management_nodes: list, cycle: dict, site_type_id: str)
         for node in filter_list_term_type(management_nodes, TermTermType.LANDCOVER)
     ]
-    def run(practice: dict):
+    def exec(practice: dict):
         term = practice.get('term', {})
-        target_group = get_lookup_value(practice.get("term", {}), 'sumIs100Group', skip_debug=True, model=MODEL)
-        has_other_land_cover_in_same_group = next((
+        term_id = term['@id']
+        should_gap_fill = term.get('termType') != TermTermType.LANDUSEMANAGEMENT.value or _should_gap_fill(term)
+        target_group = get_lookup_value(term, 'sumIs100Group', skip_debug=True, model=MODEL)
+        no_other_land_cover_in_same_group = next((
             True for node in landCover_management_nodes
             if (
                 node['sumIs100Group'] == target_group and
                 _dates_overlap(target_practice=practice, node=node, cycle=cycle, site_type_id=site_type_id)
             )
-        ), None) is not None
-        return (
-            (term.get('termType') != TermTermType.LANDUSEMANAGEMENT.value or _should_gap_fill(term)) and
-            not has_other_land_cover_in_same_group
-        )
-    return run
+        ), None) is None
+        # cannot gap-fill landCover without a `startDate`
+        has_required_startDate = term.get('termType') != TermTermType.LANDCOVER.value or practice.get('startDate')
+        should_run = all([
+            should_gap_fill,
+            has_required_startDate,
+            no_other_land_cover_in_same_group
+        ])
+        if not should_run:
+            logRequirements(site, model=MODEL, term=term_id, model_key=MODEL_KEY,
+                            should_gap_fill=should_gap_fill,
+                            has_required_startDate=has_required_startDate,
+                            no_other_land_cover_in_same_group=no_other_land_cover_in_same_group)
+            logShouldRun(site, MODEL, term_id, False, model_key=MODEL_KEY)
+        return should_run
+    return exec
 def _run_from_practices(site: dict, cycle: dict, site_type_id: str):
@@ -330,7 +343,8 @@ def _run_from_practices(site: dict, cycle: dict, site_type_id: str):
     ]
     management_nodes = site.get("management", [])
     return list(map(_map_to_value, filter(
-        _should_run_practice(management_nodes=management_nodes, cycle=cycle, site_type_id=site_type_id), practices
+        _should_run_practice(site, management_nodes, cycle, site_type_id),
+        practices
     )))

hestia_earth/models/hestia/pastureGrass.py CHANGED Viewed

@@ -1,9 +1,9 @@
 from hestia_earth.schema import SiteSiteType, TermTermType
 from hestia_earth.utils.model import linked_node
+from hestia_earth.utils.term import download_term
 from hestia_earth.models.log import logRequirements, logShouldRun
 from hestia_earth.models.utils.practice import _new_practice
-from hestia_earth.models.utils.term import download_term
 from . import MODEL
 REQUIREMENTS = {

hestia_earth/models/impact_assessment/post_checks/__init__.py CHANGED Viewed

@@ -2,7 +2,7 @@ from os.path import dirname, abspath
 import sys
 from hestia_earth.models.utils import _run_in_serie
-from . import cycle, site, remove_cache_fields
+from . import cycle, site, remove_cache_fields, remove_no_value
 CURRENT_DIR = dirname(abspath(__file__)) + '/'
 sys.path.append(CURRENT_DIR)
@@ -10,7 +10,8 @@ sys.path.append(CURRENT_DIR)
 MODELS = [
     cycle.run,
     site.run,
-    remove_cache_fields.run
+    remove_cache_fields.run,
+    remove_no_value.run
 ]

hestia_earth/models/impact_assessment/post_checks/remove_no_value.py ADDED Viewed

@@ -0,0 +1,13 @@
+_KEYS = ['impacts', 'endpoints']
+def _has_value(blank_node: dict):
+    return blank_node.get('value') is not None
+def _filter_has_value(impact: dict, key: str):
+    return list(filter(_has_value, impact[key]))
+def run(impact: dict):
+    return impact | {key: _filter_has_value(impact, key) for key in _KEYS if impact.get(key)}

hestia_earth/models/ipcc2019/biocharOrganicCarbonPerHa.py CHANGED Viewed

@@ -110,7 +110,7 @@ def _should_run(site: dict) -> tuple[bool, dict]:
     """
     cycles = related_cycles(site)
     site_type = site.get("siteType")
-    ipcc_soil_category = _assign_ipcc_soil_category(site.get("measurements", []))
+    ipcc_soil_category, soil_logs = _assign_ipcc_soil_category(site.get("measurements", []))
     has_cycles = len(cycles) > 0
     has_valid_site_type = site_type in _VALID_SITE_TYPES
@@ -140,6 +140,7 @@ def _should_run(site: dict) -> tuple[bool, dict]:
         should_compile_inventory=should_compile_inventory,
         seed=seed,
         inventory=_format_inventory(inventory),
+        **soil_logs,
         **_format_logs(logs)
     )

hestia_earth/models/ipcc2019/ch4ToAirExcreta.py CHANGED Viewed

@@ -120,7 +120,10 @@ def _get_ch4_conv_factor(cycle: dict):
                 ecoClimateZone=ecoClimateZone,
                 practice_id=practice_id)
-    return _get_excretaManagement_MCF_from_lookup(practice_id, ecoClimateZone, duration_key) if practice_id else 0
+    return _get_excretaManagement_MCF_from_lookup(practice_id, ecoClimateZone, duration_key) if all([
+        practice_id,
+        ecoClimateZone is not None
+    ]) else 0
 def _should_run(cycle: dict):

hestia_earth/models/ipcc2019/organicCarbonPerHa.py CHANGED Viewed

@@ -23,7 +23,11 @@ REQUIREMENTS = {
         ],
         "optional": {
             "measurements": [
-                {"@type": "Measurement", "value": "", "term.termType": ["soilType", "usdaSoilType"]}
+                {
+                    "@doc": "The model cannot run on sites with more than 30 percent organic soils (`histols`, `histosol` and their subclasses).",  # noqa: E501
+                    "@type": "Measurement", "value": "",
+                    "term.termType": ["soilType", "usdaSoilType"]
+                }
             ],
             "management": [
                 {

hestia_earth/models/ipcc2019/organicCarbonPerHa_tier_1.py CHANGED Viewed

@@ -19,14 +19,16 @@ from hestia_earth.models.utils.blank_node import (
 from hestia_earth.models.utils.ecoClimateZone import EcoClimateZone, get_eco_climate_zone_value
 from hestia_earth.models.utils.measurement import _new_measurement
 from hestia_earth.models.utils.property import get_node_property
-from hestia_earth.models.utils.term import get_residue_removed_or_burnt_terms, get_upland_rice_land_cover_terms
+from hestia_earth.models.utils.term import (
+    get_lookup_value, get_residue_removed_or_burnt_terms, get_upland_rice_land_cover_terms
+)
 from .organicCarbonPerHa_utils import (
-    check_irrigation, DEPTH_LOWER, DEPTH_UPPER, IPCC_SOIL_CATEGORY_TO_SOIL_TYPE_LOOKUP_VALUE,
+    check_irrigation, DEPTH_LOWER, DEPTH_UPPER, format_soil_inventory, IPCC_SOIL_CATEGORY_TO_SOIL_TYPE_LOOKUP_VALUE,
     IPCC_LAND_USE_CATEGORY_TO_LAND_COVER_LOOKUP_VALUE, IPCC_MANAGEMENT_CATEGORY_TO_GRASSLAND_MANAGEMENT_TERM_ID,
     IPCC_MANAGEMENT_CATEGORY_TO_TILLAGE_MANAGEMENT_LOOKUP_VALUE, IpccSoilCategory, IpccCarbonInputCategory,
     IpccLandUseCategory, IpccManagementCategory, is_cover_crop, MIN_AREA_THRESHOLD, sample_constant,
-    sample_plus_minus_error, sample_plus_minus_uncertainty, SITE_TYPE_TO_IPCC_LAND_USE_CATEGORY,
+    sample_plus_minus_error, sample_plus_minus_uncertainty, SITE_TYPE_TO_IPCC_LAND_USE_CATEGORY, SoilData,
     SUPER_MAJORITY_AREA_THRESHOLD, STATS_DEFINITION
 )
 from . import MODEL
@@ -45,7 +47,11 @@ REQUIREMENTS = {
         ],
         "optional": {
             "measurements": [
-                {"@type": "Measurement", "value": "", "term.termType": ["soilType", "usdaSoilType"]}
+                {
+                    "@doc": "This model cannot run on sites with more than 30 percent organic soils (`histols`, `histosol` and their subclasses).",  # noqa: E501
+                    "@type": "Measurement", "value": "",
+                    "term.termType": ["soilType", "usdaSoilType"]
+                }
             ],
             "management": [
                 {
@@ -606,16 +612,19 @@ def should_run(site: dict) -> tuple[bool, dict, dict]:
     measurement_nodes = site.get("measurements", [])
     eco_climate_zone = get_eco_climate_zone_value(site, as_enum=True)
-    ipcc_soil_category = _assign_ipcc_soil_category(measurement_nodes)
+    ipcc_soil_category, soil_logs = _assign_ipcc_soil_category(measurement_nodes)
     soc_ref = _get_soc_ref_preview(ipcc_soil_category, eco_climate_zone)
+    valid_site_type = site_type in _VALID_SITE_TYPES
+    valid_eco_climate_zone = eco_climate_zone not in _EXCLUDED_ECO_CLIMATE_ZONES
+    valid_soc_ref = isinstance(soc_ref, (float, int)) and soc_ref > 0
     has_management = len(management_nodes) > 0
     has_measurements = len(measurement_nodes) > 0
     should_compile_inventory = all([
-        site_type in _VALID_SITE_TYPES,
-        eco_climate_zone not in _EXCLUDED_ECO_CLIMATE_ZONES,
-        soc_ref or -9999 > 0,
+        valid_site_type,
+        valid_eco_climate_zone,
+        valid_soc_ref,
         has_management,
         has_measurements
     ])
@@ -638,9 +647,13 @@ def should_run(site: dict) -> tuple[bool, dict, dict]:
         year for year, group in inventory.items() if group.get(_InventoryKey.SHOULD_RUN)
     )
-    logs = inventory_logs | {
+    logs = soil_logs | inventory_logs | {
         "site_type": site_type,
+        "soc_ref_available": valid_soc_ref,
         "soc_ref": soc_ref,
+        "valid_eco_climate_zone": valid_eco_climate_zone,
+        "valid_soil_category": ipcc_soil_category not in [IpccSoilCategory.ORGANIC_SOILS],
+        "valid_site_type": valid_site_type,
         "has_management": has_management,
         "has_measurements": has_measurements,
         "should_compile_inventory_tier_1": should_compile_inventory,
@@ -1034,24 +1047,34 @@ def _assign_ipcc_soil_category(
     soil_types = _get_soil_type_measurements(measurement_nodes, TermTermType.SOILTYPE)
     usda_soil_types = _get_soil_type_measurements(measurement_nodes, TermTermType.USDASOILTYPE)
+    soil_data = [_unpack_soil_data(node) for node in soil_types]
+    usda_soil_data = [_unpack_soil_data(node) for node in usda_soil_types]
     clay_content = get_node_value(find_term_match(measurement_nodes, _CLAY_CONTENT_TERM_ID))
     sand_content = get_node_value(find_term_match(measurement_nodes, _SAND_CONTENT_TERM_ID))
     has_sandy_soil = clay_content < _CLAY_CONTENT_MAX and sand_content > _SAND_CONTENT_MIN
-    return next(
+    logs = {
+        "soil_data": format_soil_inventory(soil_data),
+        "usda_soil_data": format_soil_inventory(usda_soil_data),
+        "has_sandy_soil_texture": has_sandy_soil
+    }
+    category = next(
         (
             key for key in _SOIL_CATEGORY_DECISION_TREE
-            if _SOIL_CATEGORY_DECISION_TREE[key](
+            if _check_soil_category(
                 key=key,
-                soil_types=soil_types,
-                usda_soil_types=usda_soil_types,
+                soil_data=soil_data,
+                usda_soil_data=usda_soil_data,
                 has_sandy_soil=has_sandy_soil
             )
         ),
         default
     ) if len(soil_types) > 0 or len(usda_soil_types) > 0 else default
+    return category, logs
 def _get_soil_type_measurements(
     nodes: list[dict], term_type: Literal[TermTermType.SOILTYPE, TermTermType.USDASOILTYPE]
@@ -1067,98 +1090,66 @@ def _get_soil_type_measurements(
     )
-def _check_soil_category(
-    *,
-    key: IpccSoilCategory,
-    soil_types: list[dict],
-    usda_soil_types: list[dict],
-    **_
-) -> bool:
-    """
-    Check if the soil category matches the given key.
-    Parameters
-    ----------
-    key : IpccSoilCategory
-        The IPCC soil category to check.
-    soil_types : list[dict]
-        List of soil type measurement nodes.
-    usda_soil_types : list[dict]
-        List of USDA soil type measurement nodes
-    Returns
-    -------
-    bool
-        `True` if the soil category matches, `False` otherwise.
-    """
-    SOIL_TYPE_LOOKUP = LOOKUPS["soilType"]
-    USDA_SOIL_TYPE_LOOKUP = LOOKUPS["usdaSoilType"]
+def _unpack_soil_data(node):
+    term = node.get("term", {})
+    term_id = term.get("@id")
+    term_type = term.get("termType")
+    value = get_node_value(node)
-    target_lookup_values = IPCC_SOIL_CATEGORY_TO_SOIL_TYPE_LOOKUP_VALUE.get(key, None)
+    lookup_value = get_lookup_value(term, LOOKUPS[term_type]) if term_type else None
+    category = next(key for key, value in IPCC_SOIL_CATEGORY_TO_SOIL_TYPE_LOOKUP_VALUE.items() if value == lookup_value)
-    is_soil_type_match = cumulative_nodes_lookup_match(
-        soil_types,
-        lookup=SOIL_TYPE_LOOKUP,
-        target_lookup_values=target_lookup_values,
-        cumulative_threshold=MIN_AREA_THRESHOLD
-    )
+    return SoilData(term_id, value, category)
-    is_usda_soil_type_match = cumulative_nodes_lookup_match(
-        usda_soil_types,
-        lookup=USDA_SOIL_TYPE_LOOKUP,
-        target_lookup_values=target_lookup_values,
-        cumulative_threshold=MIN_AREA_THRESHOLD
-    )
-    return is_soil_type_match or is_usda_soil_type_match
+_IPCC_SOIL_CATEGORY_TO_OVERRIDE_KWARGS = {
+    IpccSoilCategory.SANDY_SOILS: {"has_sandy_soil"}
+}
+"""
+Keyword arguments that can override the `soilType`/`usdaSoilType` lookup match for an `IpccSoilCategory`.
+"""
-def _check_sandy_soil_category(
-    *,
-    key: IpccSoilCategory,
-    soil_types: list[dict],
-    usda_soil_types: list[dict],
-    has_sandy_soil: bool,
-    **_
+def _check_soil_category(
+    *, key: IpccSoilCategory, soil_data: list[SoilData], usda_soil_data: list[SoilData], **kwargs
 ) -> bool:
     """
-    Check if the soils are sandy.
-    This function is special case of `_check_soil_category`.
+    Check if the soil category matches the given key.
     Parameters
     ----------
     key : IpccSoilCategory
         The IPCC soil category to check.
-    soil_types : list[dict]
-        List of soil type measurement nodes.
-    usda_soil_types : list[dict]
-        List of USDA soil type measurement nodes
-    has_sandy_soil : bool
-        True if the soils are sandy, False otherwise.
+    soil_data : list[SoilData]
+        List of `SoilData` NamedEnums generated from `soilType` measurement nodes.
+    usda_soil_data : list[SoilData]
+        List of `SoilData` NamedEnums generated from `usdaSoilType` measurement nodes.
     Returns
     -------
     bool
         `True` if the soil category matches, `False` otherwise.
     """
-    return _check_soil_category(key=key, soil_types=soil_types, usda_soil_types=usda_soil_types) or has_sandy_soil
+    override_kwargs = _IPCC_SOIL_CATEGORY_TO_OVERRIDE_KWARGS.get(key, set())
+    valid_override = any(v for k, v in kwargs.items() if k in override_kwargs)
+    is_soil_match = sum(data.value for data in soil_data if data.category == key) > MIN_AREA_THRESHOLD
+    is_usda_soil_match = sum(data.value for data in usda_soil_data if data.category == key) > MIN_AREA_THRESHOLD
+    return valid_override or is_soil_match or is_usda_soil_match
-_SOIL_CATEGORY_DECISION_TREE = {
-    IpccSoilCategory.ORGANIC_SOILS: _check_soil_category,
-    IpccSoilCategory.SANDY_SOILS: _check_sandy_soil_category,
-    IpccSoilCategory.WETLAND_SOILS: _check_soil_category,
-    IpccSoilCategory.VOLCANIC_SOILS: _check_soil_category,
-    IpccSoilCategory.SPODIC_SOILS: _check_soil_category,
-    IpccSoilCategory.HIGH_ACTIVITY_CLAY_SOILS: _check_soil_category,
-    IpccSoilCategory.LOW_ACTIVITY_CLAY_SOILS: _check_soil_category
-}
-"""
-A decision tree mapping IPCC soil categories to corresponding check functions.
-Key: IpccSoilCategory
-Value: Corresponding function for checking the match of the given soil category based on soil types.
+_SOIL_CATEGORY_DECISION_TREE = [
+    IpccSoilCategory.ORGANIC_SOILS,
+    IpccSoilCategory.SANDY_SOILS,
+    IpccSoilCategory.WETLAND_SOILS,
+    IpccSoilCategory.VOLCANIC_SOILS,
+    IpccSoilCategory.SPODIC_SOILS,
+    IpccSoilCategory.HIGH_ACTIVITY_CLAY_SOILS,
+    IpccSoilCategory.LOW_ACTIVITY_CLAY_SOILS
+]
+"""
+A decision tree determining the order to check IPCC soil categories.
 """
@@ -1201,7 +1192,7 @@ def _assign_ipcc_land_use_category(
     return next(
         (
             key for key in DECISION_TREE
-            if DECISION_TREE[key](
+            if _check_ipcc_land_use_category(
                 key=key,
                 land_cover_nodes=land_cover_nodes,
                 has_long_fallow=has_long_fallow,
@@ -1317,23 +1308,19 @@ Keyword arguments that can override the `landCover` lookup match for specific `I
 """
-_LAND_USE_CATEGORY_DECISION_TREE = {
-    IpccLandUseCategory.GRASSLAND: _check_ipcc_land_use_category,
-    IpccLandUseCategory.SET_ASIDE: _check_ipcc_land_use_category,
-    IpccLandUseCategory.PERENNIAL_CROPS: _check_ipcc_land_use_category,
-    IpccLandUseCategory.PADDY_RICE_CULTIVATION: _check_ipcc_land_use_category,
-    IpccLandUseCategory.ANNUAL_CROPS_WET: _check_ipcc_land_use_category,
-    IpccLandUseCategory.ANNUAL_CROPS: _check_ipcc_land_use_category,
-    IpccLandUseCategory.FOREST: _check_ipcc_land_use_category,
-    IpccLandUseCategory.NATIVE: _check_ipcc_land_use_category,
-    IpccLandUseCategory.OTHER: _check_ipcc_land_use_category
-}
+_LAND_USE_CATEGORY_DECISION_TREE = [
+    IpccLandUseCategory.GRASSLAND,
+    IpccLandUseCategory.SET_ASIDE,
+    IpccLandUseCategory.PERENNIAL_CROPS,
+    IpccLandUseCategory.PADDY_RICE_CULTIVATION,
+    IpccLandUseCategory.ANNUAL_CROPS_WET,
+    IpccLandUseCategory.ANNUAL_CROPS,
+    IpccLandUseCategory.FOREST,
+    IpccLandUseCategory.NATIVE,
+    IpccLandUseCategory.OTHER
+]
 """
-A decision tree mapping IPCC soil categories to corresponding check functions.
-Key: IpccLandUseCategory
-Value: Corresponding function for checking the match of the given land use category based on land cover nodes
-and additional kwargs.
+A decision tree determining the order to check IPCC land use categories.
 """

hestia-earth-models 0.74.8__py3-none-any.whl → 0.74.9__py3-none-any.whl

hestia-earth-models 0.74.8__py3-none-any.whl → 0.74.9__py3-none-any.whl