PyPI - climate-ref-ilamb - Versions diffs - 0.6.5__py3-none-any.whl → 0.7.0__py3-none-any.whl - Mend

climate-ref-ilamb 0.6.5__py3-none-any.whl → 0.7.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (9) hide show

climate_ref_ilamb/configure/ilamb.yaml CHANGED Viewed

@@ -25,7 +25,7 @@ mrsos-WangMao:
     mrsol: ilamb/mrsol/WangMao/mrsol_olc.nc
   alternate_vars:
   - mrsos
-  transform:
+  transforms:
   - select_depth:
       value: 0
   - soil_moisture_to_vol_fraction

climate_ref_ilamb/configure/iomb.yaml CHANGED Viewed

@@ -5,7 +5,7 @@ thetao-WOA2023-surface:
     # TODO: Update to use the obs4REF equiv
     thetao: ilamb/WOA/thetao_mon_WOA_A5B4_gn_200501-201412.nc
   variable_cmap: Reds
-  transform:
+  transforms:
   - select_depth:
       value: 0
   alternate_vars:
@@ -15,7 +15,7 @@ so-WOA2023-surface:
   sources:
     # TODO: Update to use the obs4REF equiv
     so: ilamb/WOA/so_mon_WOA_A5B4_gn_200501-201412.nc
-  transform:
+  transforms:
   - select_depth:
       value: 0
   variable_cmap: YlGn
@@ -27,7 +27,7 @@ amoc-RAPID:
   - timeseries
   related_vars:
   - msftmz
-  transform:
+  transforms:
   - msftmz_to_rapid
   sources:
     # TODO: Update to use the obs4REF equiv
@@ -39,10 +39,10 @@ ohc-NOAA:
   related_vars:
   - thetao
   - volcello
-  transform:
+  transforms:
   - select_depth:
-      min: 0
-      max: 2000
+      vmin: 0
+      vmax: 2000
   - ocean_heat_content:
       reference_year: 2005
   analyses:

climate_ref_ilamb/standard.py CHANGED Viewed

@@ -1,14 +1,15 @@
 from pathlib import Path
 from typing import Any
-import ilamb3  # type: ignore
-import ilamb3.regions as ilr  # type: ignore
-import matplotlib.pyplot as plt
+import dask.config
+import ilamb3
+import ilamb3.regions as ilr
 import pandas as pd
 import pooch
+import xarray as xr
 from ilamb3 import run
-from climate_ref_core.constraints import AddSupplementaryDataset
+from climate_ref_core.constraints import AddSupplementaryDataset, RequireFacets
 from climate_ref_core.dataset_registry import dataset_registry_manager
 from climate_ref_core.datasets import FacetFilter, SourceDatasetType
 from climate_ref_core.diagnostics import (
@@ -17,8 +18,9 @@ from climate_ref_core.diagnostics import (
     ExecutionDefinition,
     ExecutionResult,
 )
+from climate_ref_core.metric_values.typing import SeriesMetricValue
 from climate_ref_core.pycmec.metric import CMECMetric
-from climate_ref_core.pycmec.output import CMECOutput
+from climate_ref_core.pycmec.output import CMECOutput, OutputCV
 from climate_ref_ilamb.datasets import (
     registry_to_collection,
 )
@@ -101,16 +103,7 @@ def _build_cmec_bundle(df: pd.DataFrame) -> dict[str, Any]:
     # reference_df = df[df["source"] == "Reference"]
     model_df = df[df["source"] != "Reference"]
-    # Source is formatted as "ACCESS-ESM1-5-r1i1p1f1-gn"
-    # This assumes that the member_id and grid_label are always the last two parts of the source string
-    # and don't contain '-'
-    extracted_source = model_df.source.str.extract(r"([\w-]+)-([\w\d]+)-([\w\d]+)")
-    model_df.loc[:, "source_id"] = extracted_source[0]
-    model_df.loc[:, "member_id"] = extracted_source[1]
-    model_df.loc[:, "grid_label"] = extracted_source[2]
-    # Strip out units from the name
-    # These are available in the attributes
+    # Strip out units from the name (available in the attributes)
     extracted_source = model_df.name.str.extract(r"(.*)\s\[.*\]")
     model_df.loc[:, "name"] = extracted_source[0]
@@ -149,25 +142,21 @@ def _build_cmec_bundle(df: pd.DataFrame) -> dict[str, Any]:
     return bundle
-def _form_bundles(df: pd.DataFrame) -> tuple[CMECMetric, CMECOutput]:
-    """
-    Create the output bundles (really a lift to make Ruff happy with the size of run()).
-    """
-    metric_bundle = _build_cmec_bundle(df)
-    output_bundle = CMECOutput.create_template()
-    return CMECMetric.model_validate(metric_bundle), CMECOutput.model_validate(output_bundle)
 def _set_ilamb3_options(registry: pooch.Pooch, registry_file: str) -> None:
     """
     Set options for ILAMB based on which registry file is being used.
     """
-    ilamb3.conf.reset()
+    ilamb3.conf.reset()  # type: ignore
     ilamb_regions = ilr.Regions()
     if registry_file == "ilamb":
         ilamb_regions.add_netcdf(registry.fetch("ilamb/regions/GlobalLand.nc"))
         ilamb_regions.add_netcdf(registry.fetch("ilamb/regions/Koppen_coarse.nc"))
         ilamb3.conf.set(regions=["global", "tropical"])
+    # REF's data requirement correctly will add measure data from another
+    # ensemble, but internally I also groupby. Since REF is only giving 1
+    # source_id/member_id/grid_label at a time, relax the groupby option here so
+    # these measures are part of the dataframe in ilamb3.
+    ilamb3.conf.set(comparison_groupby=["source_id", "grid_label"])
 def _load_csv_and_merge(output_directory: Path) -> pd.DataFrame:
@@ -213,29 +202,63 @@ class ILAMBStandard(Diagnostic):
                         facets={
                             "variable_id": (
                                 self.variable_id,
-                                *ilamb_kwargs.get("relationships", {}).keys(),
                                 *ilamb_kwargs.get("alternate_vars", []),
                                 *ilamb_kwargs.get("related_vars", []),
-                            )
+                                *ilamb_kwargs.get("relationships", {}).keys(),
+                            ),
+                            "frequency": "mon",
+                            "experiment_id": ("historical", "land-hist"),
+                            "table_id": (
+                                "AERmonZ",
+                                "Amon",
+                                "CFmon",
+                                "Emon",
+                                "EmonZ",
+                                "LImon",
+                                "Lmon",
+                                "Omon",
+                                "SImon",
+                            ),
                         }
                     ),
-                    FacetFilter(facets={"frequency": ("mon",)}),
-                    FacetFilter(facets={"experiment_id": ("historical", "land-hist")}),
-                    # Exclude unneeded snc tables
-                    FacetFilter(facets={"table_id": ("ImonAnt", "ImonGre")}, keep=False),
                 ),
                 constraints=(
-                    AddSupplementaryDataset.from_defaults("areacella", SourceDatasetType.CMIP6),
-                    AddSupplementaryDataset.from_defaults("sftlf", SourceDatasetType.CMIP6),
-                )
-                if registry_file == "ilamb"
-                else (
-                    AddSupplementaryDataset.from_defaults("areacello", SourceDatasetType.CMIP6),
-                    AddSupplementaryDataset.from_defaults("sftof", SourceDatasetType.CMIP6),
+                    RequireFacets(
+                        "variable_id",
+                        (
+                            self.variable_id,
+                            *ilamb_kwargs.get("alternate_vars", []),
+                            *ilamb_kwargs.get("related_vars", []),
+                        ),
+                        operator="any",
+                    ),
+                    *(
+                        [
+                            RequireFacets(
+                                "variable_id",
+                                required_facets=tuple(ilamb_kwargs.get("relationships", {}).keys()),
+                            )
+                        ]
+                        if "relationships" in ilamb_kwargs
+                        else []
+                    ),
+                    *(
+                        (
+                            AddSupplementaryDataset.from_defaults("areacella", SourceDatasetType.CMIP6),
+                            AddSupplementaryDataset.from_defaults("sftlf", SourceDatasetType.CMIP6),
+                        )
+                        if registry_file == "ilamb"
+                        else (
+                            AddSupplementaryDataset.from_defaults("volcello", SourceDatasetType.CMIP6),
+                            AddSupplementaryDataset.from_defaults("areacello", SourceDatasetType.CMIP6),
+                            AddSupplementaryDataset.from_defaults("sftof", SourceDatasetType.CMIP6),
+                        )
+                    ),
                 ),
-                group_by=("experiment_id",),
+                group_by=("experiment_id", "source_id", "member_id", "grid_label"),
             ),
         )
         self.facets = (
             "experiment_id",
             "source_id",
@@ -257,16 +280,18 @@ class ILAMBStandard(Diagnostic):
         """
         Run the ILAMB standard analysis.
         """
-        plt.rcParams.update({"figure.max_open_warning": 0})
         _set_ilamb3_options(self.registry, self.registry_file)
         ref_datasets = self.ilamb_data.datasets.set_index(self.ilamb_data.slug_column)
-        run.run_simple(
-            ref_datasets,
-            self.slug,
-            definition.datasets[SourceDatasetType.CMIP6].datasets,
-            definition.output_directory,
-            **self.ilamb_kwargs,
-        )
+        # Run ILAMB in a single-threaded mode to avoid issues with multithreading (#394)
+        with dask.config.set(scheduler="synchronous"):
+            run.run_single_block(
+                self.slug,
+                ref_datasets,
+                definition.datasets[SourceDatasetType.CMIP6].datasets,
+                definition.output_directory,
+                **self.ilamb_kwargs,
+            )
     def build_execution_result(self, definition: ExecutionDefinition) -> ExecutionResult:
         """
@@ -281,15 +306,162 @@ class ILAMBStandard(Diagnostic):
         -------
             An execution result object
         """
-        selectors = definition.datasets[SourceDatasetType.CMIP6].selector_dict()
         _set_ilamb3_options(self.registry, self.registry_file)
+        # In ILAMB, scalars are saved in CSV files in the output directory. To
+        # be compatible with the REF system we will need to add the metadata
+        # that is associated with the execution group, called the selector.
         df = _load_csv_and_merge(definition.output_directory)
-        # Add the selectors to the dataframe
-        for key, value in selectors.items():
+        selectors = definition.datasets[SourceDatasetType.CMIP6].selector_dict()
+        # TODO: Fix reference data once we are using the obs4MIPs dataset
+        dataset_source = self.name.split("-")[1] if "-" in self.name else "None"
+        common_dimensions = {**selectors, "reference_source_id": dataset_source}
+        for key, value in common_dimensions.items():
             df[key] = value
-        metric_bundle, output_bundle = _form_bundles(df)
+        metric_bundle = CMECMetric.model_validate(_build_cmec_bundle(df))
+        # Add each png file plot to the output
+        output_bundle = CMECOutput.create_template()
+        for plotfile in definition.output_directory.glob("*.png"):
+            relative_path = str(definition.as_relative_path(plotfile))
+            caption, figure_dimensions = _caption_from_filename(plotfile, common_dimensions)
+            output_bundle[OutputCV.PLOTS.value][relative_path] = {
+                OutputCV.FILENAME.value: relative_path,
+                OutputCV.LONG_NAME.value: caption,
+                OutputCV.DESCRIPTION.value: "",
+                OutputCV.DIMENSIONS.value: figure_dimensions,
+            }
+        # Add the html page to the output
+        index_html = definition.to_output_path("index.html")
+        if index_html.exists():
+            relative_path = str(definition.as_relative_path(index_html))
+            output_bundle[OutputCV.HTML.value][relative_path] = {
+                OutputCV.FILENAME.value: relative_path,
+                OutputCV.LONG_NAME.value: "Results page",
+                OutputCV.DESCRIPTION.value: "Page displaying scalars and plots from the ILAMB execution.",
+                OutputCV.DIMENSIONS.value: common_dimensions,
+            }
+            output_bundle[OutputCV.INDEX.value] = relative_path
+        # Add series to the output based on the time traces we find in the
+        # output files
+        series = []
+        for ncfile in definition.output_directory.glob("*.nc"):
+            ds = xr.open_dataset(ncfile, use_cftime=True)
+            for name, da in ds.items():
+                # Only create series for 1d DataArray's with these dimensions
+                if not (da.ndim == 1 and set(da.dims).intersection(["time", "month"])):
+                    continue
+                # Convert dimension values
+                attrs = {
+                    "units": da.attrs.get("units", ""),
+                    "long_name": da.attrs.get("long_name", str(name)),
+                    "standard_name": da.attrs.get("standard_name", ""),
+                }
+                str_name = str(name)
+                index_name = str(da.dims[0])
+                index = ds[index_name].values.tolist()
+                if hasattr(index[0], "isoformat"):
+                    index = [v.isoformat() for v in index]
+                if hasattr(index[0], "calendar"):
+                    attrs["calendar"] = index[0].calendar
+                # Parse out some dimensions
+                if ncfile.stem == "Reference":
+                    dimensions = {
+                        "source_id": "Reference",
+                        "metric": str_name,
+                    }
+                else:
+                    dimensions = {"metric": str_name, **common_dimensions}
+                # Split the metric into metric and region if possible
+                if "_" in str_name:
+                    dimensions["metric"] = str_name.split("_")[0]
+                    dimensions["region"] = str_name.split("_")[1]
+                else:
+                    dimensions["region"] = "None"
+                series.append(
+                    SeriesMetricValue(
+                        dimensions=dimensions,
+                        values=da.values.tolist(),
+                        index=index,
+                        index_name=index_name,
+                        attributes=attrs,
+                    )
+                )
         return ExecutionResult.build_from_output_bundle(
-            definition, cmec_output_bundle=output_bundle, cmec_metric_bundle=metric_bundle
+            definition, cmec_output_bundle=output_bundle, cmec_metric_bundle=metric_bundle, series=series
         )
+def _caption_from_filename(filename: Path, common_dimensions: dict[str, str]) -> tuple[str, dict[str, str]]:
+    source, region, plot = filename.stem.split("_")
+    plot_texts = {
+        "bias": "bias",
+        "biasscore": "bias score",
+        "cycle": "annual cycle",
+        "cyclescore": "annual cycle score",
+        "mean": "period mean",
+        "rmse": "RMSE",
+        "rmsescore": "RMSE score",
+        "shift": "shift in maximum month",
+        "tmax": "maxmimum month",
+        "trace": "regional mean",
+        "taylor": "Taylor diagram",
+        "distribution": "distribution",
+        "response": "response",
+    }
+    # Name of statistics dimension in CMEC output
+    plot_statistics = {
+        "bias": "Bias",
+        "biasscore": "Bias score",
+        "cycle": "Annual cycle",
+        "cyclescore": "Annual cycle score",
+        "mean": "Period Mean",
+        "rmse": "RMSE",
+        "rmsescore": "RMSE score",
+        "shift": "Shift in maximum month",
+        "tmax": "Maximum month",
+        "trace": "Regional mean",
+        "taylor": "Taylor diagram",
+        "distribution": "Distribution",
+        "response": "Response",
+    }
+    figure_dimensions = {
+        "region": region,
+    }
+    plot_option = None
+    # Some plots have options appended with a dash (distribution-pr, response-tas)
+    if "-" in plot:
+        plot, plot_option = plot.split("-", 1)
+    if plot not in plot_texts:
+        return "", figure_dimensions
+    # Build the caption
+    caption = f"The {plot_texts.get(plot)}"
+    if plot_option is not None:
+        caption += f" of {plot_option}"
+    if source != "None":
+        caption += f" for {'the reference data' if source == 'Reference' else source}"
+    if region.lower() != "none":
+        caption += f" over the {ilr.Regions().get_name(region)} region."
+    # Use the statistic dimension to determine what is being plotted
+    if plot_statistics.get(plot) is not None:
+        figure_dimensions["statistic"] = plot_statistics[plot]
+        if plot_option is not None:
+            figure_dimensions["statistic"] += f"|{plot_option}"
+    # If the source is the reference we don't need some dimensions as they are not applicable
+    if source == "Reference":
+        figure_dimensions["source_id"] = "Reference"
+    else:
+        figure_dimensions = {**common_dimensions, **figure_dimensions}
+    return caption, figure_dimensions

{climate_ref_ilamb-0.6.5.dist-info → climate_ref_ilamb-0.7.0.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: climate-ref-ilamb
-Version: 0.6.5
+Version: 0.7.0
 Summary: ILAMB diagnostic provider for the Rapid Evaluation Framework
 Author-email: Nathan Collier <nathaniel.collier@gmail.com>, Jared Lewis <jared.lewis@climate-resource.com>
 License-Expression: Apache-2.0
@@ -19,7 +19,7 @@ Classifier: Programming Language :: Python :: 3.13
 Classifier: Topic :: Scientific/Engineering
 Requires-Python: >=3.11
 Requires-Dist: climate-ref-core
-Requires-Dist: ilamb3>=2025.5.20
+Requires-Dist: ilamb3>=2025.9.9
 Requires-Dist: scipy<1.16
 Description-Content-Type: text/markdown

{climate_ref_ilamb-0.6.5.dist-info → climate_ref_ilamb-0.7.0.dist-info}/RECORD RENAMED Viewed

@@ -1,15 +1,15 @@
 climate_ref_ilamb/__init__.py,sha256=hMEkSjBY3yo-EbdMNOIvMSdGK14G2s5PERmWrBEtzFk,1414
 climate_ref_ilamb/datasets.py,sha256=MVCt1pxV5dIfYLm6huC0BZWP5stCamYNwXzc7kKW5AI,799
 climate_ref_ilamb/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-climate_ref_ilamb/standard.py,sha256=rMI-GERTn_rg6qkp7jvzFZVAc7AZHkknEtNYFbo-Bak,10556
-climate_ref_ilamb/configure/ilamb.yaml,sha256=4lzZhtn4nq4hV0qjXq9mWlN2cqIkhh_ICtYlL4gtW3k,1194
-climate_ref_ilamb/configure/iomb.yaml,sha256=PxJAivXKNiYp-HbaYOJgUO8LnL9fmSztQKxLM_jFyvQ,944
+climate_ref_ilamb/standard.py,sha256=oz1J6lbjg0kqG2vkTgSIrd_t7yDud1HiLIILeStL5Ig,17873
+climate_ref_ilamb/configure/ilamb.yaml,sha256=keUmj7Oih-AepogB7PTwN56DTb0K0k_x1CkSbbhZjJ0,1195
+climate_ref_ilamb/configure/iomb.yaml,sha256=AQ4MZFDeD4Sw-yDnLb4C-ID2JFk9jfhk_2UPUHTyH78,950
 climate_ref_ilamb/dataset_registry/ilamb.txt,sha256=_zqrq-Sa-0NTjPDFX6nQIeUalEc7tPrKr_CssOBlseg,1030
 climate_ref_ilamb/dataset_registry/iomb.txt,sha256=b95CUBYEGfeoPyRGx_E267c-2GF-E_lc4XeFkNSOJMo,375
 climate_ref_ilamb/dataset_registry/test.txt,sha256=gBjUJ6W-crghYqKN0QOFmjyqpMxKK50dU3SYTuIA6jM,206
-climate_ref_ilamb-0.6.5.dist-info/METADATA,sha256=OKlmtX3Tp7e5hb_tBdj_qOBl_qbH7PjlTBYQerZyS64,2343
-climate_ref_ilamb-0.6.5.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
-climate_ref_ilamb-0.6.5.dist-info/entry_points.txt,sha256=SnRhJk7KRiGd3jL4OMA2SId5p838T95kGcVrr3wtZAQ,59
-climate_ref_ilamb-0.6.5.dist-info/licenses/LICENCE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
-climate_ref_ilamb-0.6.5.dist-info/licenses/NOTICE,sha256=4qTlax9aX2-mswYJuVrLqJ9jK1IkN5kSBqfVvYLF3Ws,128
-climate_ref_ilamb-0.6.5.dist-info/RECORD,,
+climate_ref_ilamb-0.7.0.dist-info/METADATA,sha256=ECoWJL9GEKTyyvrRunXcuO4e7oReRnu-suHyHxqQeTo,2342
+climate_ref_ilamb-0.7.0.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
+climate_ref_ilamb-0.7.0.dist-info/entry_points.txt,sha256=SnRhJk7KRiGd3jL4OMA2SId5p838T95kGcVrr3wtZAQ,59
+climate_ref_ilamb-0.7.0.dist-info/licenses/LICENCE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
+climate_ref_ilamb-0.7.0.dist-info/licenses/NOTICE,sha256=4qTlax9aX2-mswYJuVrLqJ9jK1IkN5kSBqfVvYLF3Ws,128
+climate_ref_ilamb-0.7.0.dist-info/RECORD,,

{climate_ref_ilamb-0.6.5.dist-info → climate_ref_ilamb-0.7.0.dist-info}/WHEEL RENAMED Viewed

File without changes

{climate_ref_ilamb-0.6.5.dist-info → climate_ref_ilamb-0.7.0.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{climate_ref_ilamb-0.6.5.dist-info → climate_ref_ilamb-0.7.0.dist-info}/licenses/LICENCE RENAMED Viewed

File without changes

{climate_ref_ilamb-0.6.5.dist-info → climate_ref_ilamb-0.7.0.dist-info}/licenses/NOTICE RENAMED Viewed

File without changes

climate-ref-ilamb 0.6.5__py3-none-any.whl → 0.7.0__py3-none-any.whl

climate-ref-ilamb 0.6.5__py3-none-any.whl → 0.7.0__py3-none-any.whl