PyPI - tobac - Versions diffs - 1.6.2__py3-none-any.whl - Mend

tobac 1.6.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (53) hide show

tobac/__init__.py +112 -0
tobac/analysis/__init__.py +31 -0
tobac/analysis/cell_analysis.py +628 -0
tobac/analysis/feature_analysis.py +212 -0
tobac/analysis/spatial.py +619 -0
tobac/centerofgravity.py +226 -0
tobac/feature_detection.py +1758 -0
tobac/merge_split.py +324 -0
tobac/plotting.py +2321 -0
tobac/segmentation/__init__.py +10 -0
tobac/segmentation/watershed_segmentation.py +1316 -0
tobac/testing.py +1179 -0
tobac/tests/segmentation_tests/test_iris_xarray_segmentation.py +0 -0
tobac/tests/segmentation_tests/test_segmentation.py +1183 -0
tobac/tests/segmentation_tests/test_segmentation_time_pad.py +104 -0
tobac/tests/test_analysis_spatial.py +1109 -0
tobac/tests/test_convert.py +265 -0
tobac/tests/test_datetime.py +216 -0
tobac/tests/test_decorators.py +148 -0
tobac/tests/test_feature_detection.py +1321 -0
tobac/tests/test_generators.py +273 -0
tobac/tests/test_import.py +24 -0
tobac/tests/test_iris_xarray_match_utils.py +244 -0
tobac/tests/test_merge_split.py +351 -0
tobac/tests/test_pbc_utils.py +497 -0
tobac/tests/test_sample_data.py +197 -0
tobac/tests/test_testing.py +747 -0
tobac/tests/test_tracking.py +714 -0
tobac/tests/test_utils.py +650 -0
tobac/tests/test_utils_bulk_statistics.py +789 -0
tobac/tests/test_utils_coordinates.py +328 -0
tobac/tests/test_utils_internal.py +97 -0
tobac/tests/test_xarray_utils.py +232 -0
tobac/tracking.py +613 -0
tobac/utils/__init__.py +27 -0
tobac/utils/bulk_statistics.py +360 -0
tobac/utils/datetime.py +184 -0
tobac/utils/decorators.py +540 -0
tobac/utils/general.py +753 -0
tobac/utils/generators.py +87 -0
tobac/utils/internal/__init__.py +2 -0
tobac/utils/internal/coordinates.py +430 -0
tobac/utils/internal/iris_utils.py +462 -0
tobac/utils/internal/label_props.py +82 -0
tobac/utils/internal/xarray_utils.py +439 -0
tobac/utils/mask.py +364 -0
tobac/utils/periodic_boundaries.py +419 -0
tobac/wrapper.py +244 -0
tobac-1.6.2.dist-info/METADATA +154 -0
tobac-1.6.2.dist-info/RECORD +53 -0
tobac-1.6.2.dist-info/WHEEL +5 -0
tobac-1.6.2.dist-info/licenses/LICENSE +29 -0
tobac-1.6.2.dist-info/top_level.txt +1 -0

tobac/tests/test_generators.py ADDED Viewed

@@ -0,0 +1,273 @@
+"""Unit tests for tobac.utils.generators module"""
+from datetime import datetime, timedelta
+import cftime
+import numpy as np
+import pandas as pd
+import pytest
+import xarray as xr
+from pandas.testing import assert_frame_equal
+from tobac.utils import generators
+def test_field_and_features_over_time():
+    """Test iterating over field_and_features_over_time generator"""
+    test_data = xr.DataArray(
+        np.zeros([2, 10, 10]),
+        dims=("time", "y", "x"),
+        coords={"time": [datetime(2000, 1, 1), datetime(2000, 1, 1, 1)]},
+    )
+    test_features = pd.DataFrame(
+        {
+            "feature": [1, 2, 3],
+            "frame": [0, 0, 1],
+            "time": [
+                datetime(2000, 1, 1),
+                datetime(2000, 1, 1),
+                datetime(2000, 1, 1, 1),
+            ],
+        }
+    )
+    iterator = generators.field_and_features_over_time(test_data, test_features)
+    iter_0 = next(iterator)
+    assert iter_0[0] == 0
+    assert iter_0[1] == np.datetime64("2000-01-01")
+    assert np.all(iter_0[2] == test_data.isel(time=0))
+    assert_frame_equal(
+        iter_0[3], test_features[test_features.time == datetime(2000, 1, 1)]
+    )
+    iter_1 = next(iterator)
+    assert iter_1[0] == 1
+    assert iter_1[1] == np.datetime64("2000-01-01 01:00:00")
+    assert np.all(iter_1[2] == test_data.isel(time=1))
+    assert_frame_equal(
+        iter_1[3], test_features[test_features.time == datetime(2000, 1, 1, 1)]
+    )
+    with pytest.raises(StopIteration):
+        next(iterator)
+def test_field_and_features_over_time_no_0_dataframe():
+    """Test that field and features over time works when the dataframe has no 0
+    index value
+    """
+    test_data = xr.DataArray(
+        np.zeros([2, 10, 10]),
+        dims=("time", "y", "x"),
+        coords={"time": [datetime(2000, 1, 1), datetime(2000, 1, 1, 1)]},
+    )
+    test_features = pd.DataFrame(
+        {
+            "feature": [1, 2, 3],
+            "frame": [0, 0, 1],
+            "time": [
+                datetime(2000, 1, 1),
+                datetime(2000, 1, 1),
+                datetime(2000, 1, 1, 1),
+            ],
+        },
+        index=[1, 2, 3],
+    )
+    iterator = generators.field_and_features_over_time(test_data, test_features)
+    iter_0 = next(iterator)
+    assert iter_0[0] == 0
+    assert iter_0[1] == np.datetime64("2000-01-01")
+    assert np.all(iter_0[2] == test_data.isel(time=0))
+    assert_frame_equal(
+        iter_0[3], test_features[test_features.time == datetime(2000, 1, 1)]
+    )
+def test_field_and_features_over_time_time_padding():
+    """Test the time_padding functionality of field_and_features_over_time
+    generator
+    """
+    test_data = xr.DataArray(
+        np.zeros([1, 10, 10]),
+        dims=("time", "y", "x"),
+        coords={"time": [datetime(2000, 1, 1)]},
+    )
+    test_features = pd.DataFrame(
+        {
+            "feature": [1, 2, 3],
+            "frame": [0, 0, 0],
+            "time": [
+                datetime(2000, 1, 1),
+                datetime(2000, 1, 1, 0, 0, 1),
+                datetime(2000, 1, 1, 0, 0, 2),
+            ],
+        }
+    )
+    #  Test no time padding
+    _, _, _, df_slice = next(
+        generators.field_and_features_over_time(test_data, test_features)
+    )
+    assert len(df_slice) == 1
+    assert_frame_equal(df_slice, test_features.loc[0:0])
+    # Test time padding of 1 second
+    _, _, _, df_slice = next(
+        generators.field_and_features_over_time(
+            test_data, test_features, time_padding=timedelta(seconds=1)
+        )
+    )
+    assert len(df_slice) == 2
+    assert_frame_equal(df_slice, test_features.loc[0:1])
+    # Test time padding of 2 seconds
+    _, _, _, df_slice = next(
+        generators.field_and_features_over_time(
+            test_data, test_features, time_padding=timedelta(seconds=2)
+        )
+    )
+    assert len(df_slice) == 3
+    assert_frame_equal(df_slice, test_features.loc[0:2])
+def test_field_and_features_over_time_cftime():
+    """Test field_and_features_over_time when given cftime datetime formats"""
+    test_data = xr.DataArray(
+        np.zeros([2, 10, 10]),
+        dims=("time", "y", "x"),
+        coords={
+            "time": [
+                cftime.Datetime360Day(2000, 1, 1),
+                cftime.Datetime360Day(2000, 1, 1, 1),
+            ]
+        },
+    )
+    test_features = pd.DataFrame(
+        {
+            "feature": [1, 2, 3],
+            "frame": [0, 0, 1],
+            "time": [
+                cftime.Datetime360Day(2000, 1, 1),
+                cftime.Datetime360Day(2000, 1, 1, 0, 0, 1),
+                cftime.Datetime360Day(2000, 1, 1, 1),
+            ],
+        }
+    )
+    iterator = generators.field_and_features_over_time(
+        test_data, test_features, time_padding=timedelta(seconds=1)
+    )
+    iter_0 = next(iterator)
+    assert iter_0[0] == 0
+    assert iter_0[1] == cftime.Datetime360Day(2000, 1, 1)
+    assert np.all(iter_0[2] == test_data.isel(time=0))
+    assert_frame_equal(iter_0[3], test_features.loc[0:1])
+    iter_1 = next(iterator)
+    assert iter_1[0] == 1
+    assert iter_1[1] == cftime.Datetime360Day(2000, 1, 1, 1)
+    assert np.all(iter_1[2] == test_data.isel(time=1))
+    assert_frame_equal(
+        iter_1[3],
+        test_features[test_features.time == cftime.Datetime360Day(2000, 1, 1, 1)],
+    )
+    with pytest.raises(StopIteration):
+        next(iterator)
+def test_field_and_features_over_time_time_var_name():
+    """Test field_and_features_over_time generator works correctly with a time
+    coordinate name other than "time"
+    """
+    # Test non-standard time coord name:
+    test_data = xr.DataArray(
+        np.zeros([2, 10, 10]),
+        dims=("time_testing", "y", "x"),
+        coords={"time_testing": [datetime(2000, 1, 1), datetime(2000, 1, 1, 1)]},
+    )
+    test_features = pd.DataFrame(
+        {
+            "feature": [1, 2, 3],
+            "frame": [0, 0, 1],
+            "time_testing": [
+                datetime(2000, 1, 1),
+                datetime(2000, 1, 1),
+                datetime(2000, 1, 1, 1),
+            ],
+        }
+    )
+    _ = next(
+        generators.field_and_features_over_time(
+            test_data, test_features, time_var_name="time_testing"
+        )
+    )
+def test_field_and_features_over_time_time_var_name_error():
+    """Test that field_and_features_over_time generator raises the correct
+    error when the name of the time coordinates do not match between the given
+    data and dataframe
+    """
+    # Test if time_var_name not in dataarray:
+    test_data = xr.DataArray(
+        np.zeros([2, 10, 10]),
+        dims=("time_testing", "y", "x"),
+        coords={"time_testing": [datetime(2000, 1, 1), datetime(2000, 1, 1, 1)]},
+    )
+    test_features = pd.DataFrame(
+        {
+            "feature": [1, 2, 3],
+            "frame": [0, 0, 1],
+            "time": [
+                datetime(2000, 1, 1),
+                datetime(2000, 1, 1),
+                datetime(2000, 1, 1, 1),
+            ],
+        }
+    )
+    with pytest.raises(ValueError, match="time not present in input field*"):
+        next(generators.field_and_features_over_time(test_data, test_features))
+    # Test if time var name not in dataframe:
+    test_data = xr.DataArray(
+        np.zeros([2, 10, 10]),
+        dims=("time", "y", "x"),
+        coords={"time": [datetime(2000, 1, 1), datetime(2000, 1, 1, 1)]},
+    )
+    test_features = pd.DataFrame(
+        {
+            "feature": [1, 2, 3],
+            "frame": [0, 0, 1],
+            "time_testing": [
+                datetime(2000, 1, 1),
+                datetime(2000, 1, 1),
+                datetime(2000, 1, 1, 1),
+            ],
+        }
+    )
+    with pytest.raises(ValueError, match="time not present in input feature*"):
+        next(generators.field_and_features_over_time(test_data, test_features))

tobac/tests/test_import.py ADDED Viewed

@@ -0,0 +1,24 @@
+import pytest
+import tobac
+def test_dummy_function():
+    assert 1 == 1
+def test_version():
+    """Test to make sure that we have a version number included.
+    Also test to make sure that the version number complies with
+    semantic versioning guidelines.
+    If it's not, this should result in an error.
+    """
+    import re
+    assert type(tobac.__version__) is str
+    # Make sure that we are following semantic versioning
+    # i.e., our version is of form x.x.x, where x are all
+    # integer numbers.
+    assert (
+        re.match(r"[0-9]+\.[0-9]+\.[0-9]+", tobac.__version__) is not None
+        or tobac.__version__ == "unknown_dev_version"
+    )

tobac/tests/test_iris_xarray_match_utils.py ADDED Viewed

@@ -0,0 +1,244 @@
+"""Tests to confirm that xarray and iris pathways work the same and produce the same data
+for the same input datasets.
+"""
+from __future__ import annotations
+import copy
+import datetime
+import iris.cube
+import numpy as np
+import pandas as pd
+import xarray as xr
+import pytest
+import tobac.testing as tbtest
+import tobac.utils.internal.iris_utils as iris_utils
+import tobac.utils.internal.xarray_utils as xr_utils
+import tobac.utils.datetime as datetime_utils
+from tobac.utils.decorators import convert_cube_to_dataarray
+@pytest.mark.parametrize(
+    "feature_positions, coordinates, expected_val",
+    [
+        (
+            ((0, 0, 0), (9, 9, 9)),
+            {"x": ("x", np.linspace(0, 10, 10)), "z": ("z", np.linspace(0, 10, 10))},
+            {"x": (0, 10)},
+        ),
+        (
+            ((0, 0), (9, 9)),
+            {"x": ("x", np.linspace(0, 10, 10))},
+            {"x": (0, 10)},
+        ),
+        (
+            ((0, 0), (9, 9), (5, 7)),
+            {
+                "longitude": ("x", np.linspace(-30, 60, 10)),
+                "latitude": ("y", np.linspace(-70, 20, 10)),
+            },
+            {"latitude": (-70, 20, 0), "longitude": (-30, 60, 20)},
+        ),
+        (
+            ((0, 0), (9, 9), (5, 7), (3.6, 7.9)),
+            {
+                "longitude": (
+                    ("x", "y"),
+                    np.arange(-180, -80).reshape(10, -1),
+                ),
+                "latitude": (("x", "y"), np.arange(-50, 50).reshape(10, -1)),
+            },
+            {
+                "latitude": (-50, 49, 7, -6.1),
+                "longitude": (-180, -81, -123, -136.1),
+            },
+        ),
+    ],
+)
+def test_add_coordinates_xarray_base(
+    feature_positions: tuple[tuple[float]],
+    coordinates: dict[str : tuple[str, np.ndarray]],
+    expected_val: dict[str : tuple[float]],
+):
+    """
+    Test that adding coordinates for xarray and iris are equal, using an
+    xarray generated dataset as the base.
+    Parameters
+    ----------
+    feature_positions: tuple of tuple of floats
+        Locations of the features to test in (hdim_1, hdim_2, zdim [optional]) coordinates
+    coordinates: dict, key: str; value: tuple of str, numpy array
+        Coordinates to use, in xarray coordinate style. Dims will be ('x', 'y', 'z') for 3D
+        data (determined by feature_positions) and ('x', 'y') for 2D data. All axes will have
+        size 10.
+    expected_val: dict, key: str; value: tuple of floats
+        Expected interpolated coordinates
+    """
+    all_indiv_feats = []
+    if len(feature_positions[0]) == 2:
+        is_3D = False
+    elif len(feature_positions[0]) == 3:
+        is_3D = True
+    else:
+        raise ValueError("Feature positions should be 2 or 3D")
+    for i, single_feat_position in enumerate(feature_positions):
+        if not is_3D and len(single_feat_position) == 2:
+            all_indiv_feats.append(
+                tbtest.generate_single_feature(
+                    single_feat_position[0],
+                    single_feat_position[1],
+                    feature_num=i,
+                    max_h1=10,
+                    max_h2=10,
+                )
+            )
+        elif is_3D and len(single_feat_position) == 3:
+            all_indiv_feats.append(
+                tbtest.generate_single_feature(
+                    single_feat_position[0],
+                    single_feat_position[1],
+                    start_v=single_feat_position[2],
+                    feature_num=i,
+                    max_h1=10,
+                    max_h2=10,
+                )
+            )
+        else:
+            raise ValueError("Feature positions should be 2 or 3D")
+    all_feats = pd.concat(all_indiv_feats)
+    da_size = (1, 10, 10, 10) if is_3D else (1, 10, 10)
+    dims = ("time", "x", "y", "z") if is_3D else ("time", "x", "y")
+    coordinates["time"] = np.array((datetime.datetime(2000, 1, 1, 0),))
+    da_with_coords = xr.DataArray(data=np.empty(da_size), dims=dims, coords=coordinates)
+    if is_3D:
+        iris_coord_interp = iris_utils.add_coordinates_3D(
+            all_feats, da_with_coords.to_iris()
+        )
+        xr_coord_interp = xr_utils.add_coordinates_to_features(
+            all_feats, da_with_coords
+        )
+    else:
+        iris_coord_interp = iris_utils.add_coordinates(
+            all_feats, da_with_coords.to_iris()
+        )
+        xr_coord_interp = xr_utils.add_coordinates_to_features(
+            all_feats, da_with_coords
+        )
+    for val_name in expected_val:
+        np.testing.assert_almost_equal(
+            iris_coord_interp[val_name], expected_val[val_name]
+        )
+        np.testing.assert_almost_equal(
+            xr_coord_interp[val_name], expected_val[val_name]
+        )
+        # assert (iris_coord_interp[val_name] == expected_val[val_name]).all()
+        # assert (xr_coord_interp[val_name] == expected_val[val_name]).all()
+    # Convert datetimes to ensure that they are the same type:
+    xr_coord_interp["time"] = datetime_utils.match_datetime_format(
+        xr_coord_interp.time, iris_coord_interp.time
+    )
+    pd.testing.assert_frame_equal(iris_coord_interp, xr_coord_interp)
+@pytest.mark.parametrize(
+    "coordinate_names, coordinate_standard_names",
+    [(("lat",), ("latitude",))],
+)
+def test_add_coordinates_xarray_std_names(
+    coordinate_names: tuple[str],
+    coordinate_standard_names: tuple[str],
+):
+    """
+    Test that adding coordinates for xarray and iris result in the same coordinate names
+    when standard_names are added to the xarray coordinates
+    Parameters
+    ----------
+    coordinate_names: tuple of str
+        names of coordinates to give
+    coordinate_standard_name: tuple of str
+        standard_names of coordinates to give
+    """
+    all_feats = tbtest.generate_single_feature(
+        0,
+        0,
+        feature_num=1,
+        max_h1=10,
+        max_h2=10,
+    )
+    da_size = (1, 10, 10)
+    dims = ("time", "x", "y")
+    coordinates = dict()
+    coordinates["time"] = np.array((datetime.datetime(2000, 1, 1, 0),))
+    for coord_name, coord_standard_name in zip(
+        coordinate_names, coordinate_standard_names
+    ):
+        coordinates[coord_name] = xr.DataArray(data=np.arange(10), dims="x")
+        coordinates[coord_name].attrs["standard_name"] = coord_standard_name
+    da_with_coords = xr.DataArray(data=np.empty(da_size), dims=dims, coords=coordinates)
+    iris_coord_interp = iris_utils.add_coordinates(
+        copy.deepcopy(all_feats), da_with_coords.to_iris()
+    )
+    xr_coord_interp = xr_utils.add_coordinates_to_features(
+        copy.deepcopy(all_feats), da_with_coords
+    )
+    xr_coord_interp["time"] = datetime_utils.match_datetime_format(
+        xr_coord_interp.time, iris_coord_interp.time
+    )
+    pd.testing.assert_frame_equal(iris_coord_interp, xr_coord_interp)
+def test_preserve_iris_datetime_types():
+    """
+    Test that xarray.add_coordinates_to_features correctly returns the same time types as
+    iris when preserve_iris_datetime_types = True.
+    """
+    all_feats = tbtest.generate_single_feature(
+        0,
+        0,
+        feature_num=1,
+        max_h1=10,
+        max_h2=10,
+    )
+    var_array: iris.cube.Cube = tbtest.make_simple_sample_data_2D(data_type="iris")
+    xarray_output = xr_utils.add_coordinates_to_features(
+        all_feats,
+        convert_cube_to_dataarray(var_array, preserve_iris_datetime_types=True),
+    )
+    iris_output = iris_utils.add_coordinates(all_feats, var_array)
+    pd.testing.assert_frame_equal(xarray_output, iris_output)
+    assert xarray_output["time"].values[0] == iris_output["time"].values[0]
+    assert isinstance(
+        xarray_output["time"].values[0], type(iris_output["time"].values[0])
+    )
+    xarray_output_datetime_preserve_off = xr_utils.add_coordinates_to_features(
+        all_feats,
+        convert_cube_to_dataarray(var_array, preserve_iris_datetime_types=False),
+    )
+    assert isinstance(
+        xarray_output_datetime_preserve_off["time"].values[0], np.datetime64
+    )