PyPI - ssb-sgis - Versions diffs - 1.0.2__py3-none-any.whl → 1.0.4__py3-none-any.whl - Mend

ssb-sgis 1.0.2__py3-none-any.whl → 1.0.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (50) hide show

sgis/__init__.py +20 -9
sgis/debug_config.py +24 -0
sgis/exceptions.py +2 -2
sgis/geopandas_tools/bounds.py +33 -36
sgis/geopandas_tools/buffer_dissolve_explode.py +136 -35
sgis/geopandas_tools/centerlines.py +4 -91
sgis/geopandas_tools/cleaning.py +1576 -583
sgis/geopandas_tools/conversion.py +38 -19
sgis/geopandas_tools/duplicates.py +29 -8
sgis/geopandas_tools/general.py +263 -100
sgis/geopandas_tools/geometry_types.py +4 -4
sgis/geopandas_tools/neighbors.py +19 -15
sgis/geopandas_tools/overlay.py +2 -2
sgis/geopandas_tools/point_operations.py +5 -5
sgis/geopandas_tools/polygon_operations.py +510 -105
sgis/geopandas_tools/polygons_as_rings.py +40 -8
sgis/geopandas_tools/sfilter.py +29 -12
sgis/helpers.py +3 -3
sgis/io/dapla_functions.py +238 -19
sgis/io/read_parquet.py +1 -1
sgis/maps/examine.py +27 -12
sgis/maps/explore.py +450 -65
sgis/maps/legend.py +177 -76
sgis/maps/map.py +206 -103
sgis/maps/maps.py +178 -105
sgis/maps/thematicmap.py +243 -83
sgis/networkanalysis/_service_area.py +6 -1
sgis/networkanalysis/closing_network_holes.py +2 -2
sgis/networkanalysis/cutting_lines.py +15 -8
sgis/networkanalysis/directednetwork.py +1 -1
sgis/networkanalysis/finding_isolated_networks.py +15 -8
sgis/networkanalysis/networkanalysis.py +17 -19
sgis/networkanalysis/networkanalysisrules.py +1 -1
sgis/networkanalysis/traveling_salesman.py +1 -1
sgis/parallel/parallel.py +64 -27
sgis/raster/__init__.py +0 -6
sgis/raster/base.py +208 -0
sgis/raster/cube.py +54 -8
sgis/raster/image_collection.py +3257 -0
sgis/raster/indices.py +17 -5
sgis/raster/raster.py +138 -243
sgis/raster/sentinel_config.py +120 -0
sgis/raster/zonal.py +0 -1
{ssb_sgis-1.0.2.dist-info → ssb_sgis-1.0.4.dist-info}/METADATA +6 -7
ssb_sgis-1.0.4.dist-info/RECORD +62 -0
sgis/raster/methods_as_functions.py +0 -0
sgis/raster/torchgeo.py +0 -171
ssb_sgis-1.0.2.dist-info/RECORD +0 -61
{ssb_sgis-1.0.2.dist-info → ssb_sgis-1.0.4.dist-info}/LICENSE +0 -0
{ssb_sgis-1.0.2.dist-info → ssb_sgis-1.0.4.dist-info}/WHEEL +0 -0

sgis/maps/map.py CHANGED Viewed

@@ -4,6 +4,8 @@ This module holds the Map class, which is the basis for the Explore class.
 """
 import warnings
+from collections.abc import Sequence
+from statistics import mean
 from typing import Any
 import matplotlib
@@ -22,6 +24,10 @@ from ..geopandas_tools.general import clean_geoms
 from ..geopandas_tools.general import drop_inactive_geometry_columns
 from ..geopandas_tools.general import get_common_crs
 from ..helpers import get_object_name
+from ..helpers import unit_is_meters
+from ..raster.image_collection import Band
+from ..raster.image_collection import Image
+from ..raster.image_collection import ImageCollection
 try:
     from torchgeo.datasets.geo import RasterDataset
@@ -42,18 +48,18 @@ pd.options.mode.chained_assignment = None
 # similar colors. The palette is like the "Set2" cmap from matplotlib, but with more
 # colors. If more than 14 categories, the geopandas default cmap is used.
 _CATEGORICAL_CMAP = {
-    0: "#4576ff",
-    1: "#ff455e",
-    2: "#ffa617",
-    3: "#ff8cc9",
-    4: "#804e00",
-    5: "#99ff00",
-    6: "#fff700",
+    0: "#3b93ff",
+    1: "#ff3370",
+    2: "#f7cf19",
+    3: "#60e825",
+    4: "#ff8cc9",
+    5: "#804e00",
+    6: "#e3dc00",
     7: "#00ffee",
-    8: "#36d19b",
-    9: "#94006b",
-    10: "#750000",
+    9: "#870062",
+    10: "#751500",
     11: "#1c6b00",
+    8: "#7cebb9",
 }
 DEFAULT_SCHEME = "quantiles"
@@ -91,12 +97,12 @@ class Map:
         self,
         *gdfs: GeoDataFrame,
         column: str | None = None,
-        labels: tuple[str] | None = None,
         k: int = 5,
         bins: tuple[float] | None = None,
         nan_label: str = "Missing",
         nan_color="#c2c2c2",
         scheme: str = DEFAULT_SCHEME,
+        cmap: str | None = None,
         **kwargs,
     ) -> None:
         """Initialiser.
@@ -104,12 +110,13 @@ class Map:
         Args:
             *gdfs: Variable length GeoDataFrame list.
             column: The column name to work with.
-            labels: Tuple of labels for each GeoDataFrame.
             k: Number of bins or classes for classification (default: 5).
             bins: Predefined bins for data classification.
             nan_label: Label for missing data.
             nan_color: Color for missing data.
             scheme: Classification scheme to be used.
+            cmap (str): Colormap of the plot. See:
+                https://matplotlib.org/stable/tutorials/colors/colormaps.html
             **kwargs: Arbitrary keyword arguments.
         """
         gdfs, column, kwargs = self._separate_args(gdfs, column, kwargs)
@@ -119,27 +126,14 @@ class Map:
         self._k = k
         self.nan_label = nan_label
         self.nan_color = nan_color
-        self._cmap = kwargs.pop("cmap", None)
+        self._cmap = cmap
         self.scheme = scheme
-        if not all(isinstance(gdf, GeoDataFrame) for gdf in gdfs):
-            gdfs = [
-                to_gdf(gdf) if not isinstance(gdf, GeoDataFrame) else gdf
-                for gdf in gdfs
-            ]
-            if not all(isinstance(gdf, GeoDataFrame) for gdf in gdfs):
-                raise ValueError("gdfs must be GeoDataFrames.")
-        if "namedict" in kwargs:
-            for i, gdf in enumerate(gdfs):
-                gdf.name = kwargs["namedict"][i]
-            kwargs.pop("namedict")
         # need to get the object names of the gdfs before copying. Only getting,
         # not setting, labels. So the original gdfs don't get the label column.
-        self.labels = labels
-        if not self.labels:
-            self._get_labels(gdfs)
+        self.labels: list[str] = [
+            _determine_best_name(gdf, column, i) for i, gdf in enumerate(gdfs)
+        ]
         show = kwargs.pop("show", True)
         if isinstance(show, (int, bool)):
@@ -153,6 +147,7 @@ class Map:
             show_temp = show
         show_args = show_temp[: len(gdfs)]
+        # gdfs that are in kwargs
         show_kwargs = show_temp[len(gdfs) :]
         self._gdfs = []
         new_labels = []
@@ -165,31 +160,20 @@ class Map:
             if not len(gdf):
                 continue
-            self._gdfs.append(gdf)
+            self._gdfs.append(to_gdf(gdf))
             new_labels.append(label)
             self.show.append(show)
         self.labels = new_labels
-        # if len(self._gdfs):
-        #     last_show = self.show[-1]
-        # else:
-        #     last_show = show
         # pop all geometry-like items from kwargs into self._gdfs
         self.kwargs = {}
         i = 0
         for key, value in kwargs.items():
-            # if isinstance(value, GeoDataFrame):
-            #     self._gdfs.append(value)
-            #     self.labels.append(key)
-            #     try:
-            #         show = show_kwargs[i]
-            #     except IndexError:
-            #         pass
-            #     self.show.append(show)
-            #     i += 1
-            #     continue
             try:
+                if isinstance(value, Geometry):
+                    value = to_gdf(value)
+                if not len(value):
+                    continue
                 self._gdfs.append(to_gdf(value))
                 self.labels.append(key)
                 try:
@@ -207,11 +191,11 @@ class Map:
                 f"length as gdfs ({len(gdfs)}). Got len {len(show)}"
             )
-        if not any(len(gdf) for gdf in self._gdfs):
-            warnings.warn("None of the GeoDataFrames have rows.", stacklevel=1)
-            self._gdfs = None
+        if not self._gdfs or not any(len(gdf) for gdf in self._gdfs):
+            self._gdfs = []
             self._is_categorical = True
             self._unique_values = []
+            self._nan_idx = []
             return
         if not self.labels:
@@ -241,6 +225,10 @@ class Map:
         self._nan_idx = self._gdf[self._column].isna()
         self._get_unique_values()
+    def __bool__(self) -> bool:
+        """True of any gdfs with more than 0 rows."""
+        return bool(len(self._gdfs) + len(self._gdf))
     def _get_unique_values(self) -> None:
         if not self._is_categorical:
             self._unique_values = self._get_unique_floats()
@@ -262,7 +250,7 @@ class Map:
         Because floats don't always equal each other. This will make very
         similar values count as the same value in the color classification.
         """
-        array = self._gdf.loc[~self._nan_idx, self._column]
+        array = self._gdf.loc[list(~self._nan_idx), self._column]
         self._min = np.min(array)
         self._max = np.max(array)
         self._get_multiplier(array)
@@ -313,29 +301,70 @@ class Map:
         # make sure they are lists
         bins = [bin_ for bin_ in bins]
-        if min(bins) > 0 and min(self._gdf.loc[~self._nan_idx, self._column]) < min(
-            bins
-        ):
-            bins = [min(self._gdf.loc[~self._nan_idx, self._column])] + bins
-        if min(bins) < 0 and min(self._gdf.loc[~self._nan_idx, self._column]) < min(
-            bins
-        ):
-            bins = [min(self._gdf.loc[~self._nan_idx, self._column])] + bins
+        if min(bins) > 0 and min(
+            self._gdf.loc[list(~self._nan_idx), self._column]
+        ) < min(bins):
+            num = min(self._gdf.loc[list(~self._nan_idx), self._column])
+            # if isinstance(num, float):
+            #     num -= (
+            #         float(f"1e-{abs(self.legend.rounding)}")
+            #         if self.legend and self.legend.rounding
+            #         else 0
+            #     )
+            bins = [num] + bins
+        if min(bins) < 0 and min(
+            self._gdf.loc[list(~self._nan_idx), self._column]
+        ) < min(bins):
+            num = min(self._gdf.loc[list(~self._nan_idx), self._column])
+            # if isinstance(num, float):
+            #     num -= (
+            #         float(f"1e-{abs(self.legend.rounding)}")
+            #         if self.legend and self.legend.rounding
+            #         else 0
+            #     )
+            bins = [num] + bins
         if max(bins) > 0 and max(
             self._gdf.loc[self._gdf[self._column].notna(), self._column]
         ) > max(bins):
-            bins = bins + [
-                max(self._gdf.loc[self._gdf[self._column].notna(), self._column])
-            ]
+            num = max(self._gdf.loc[self._gdf[self._column].notna(), self._column])
+            # if isinstance(num, float):
+            #     num += (
+            #         float(f"1e-{abs(self.legend.rounding)}")
+            #         if self.legend and self.legend.rounding
+            #         else 0
+            #     )
+            bins = bins + [num]
         if max(bins) < 0 and max(
             self._gdf.loc[self._gdf[self._column].notna(), self._column]
         ) < max(bins):
-            bins = bins + [
-                max(self._gdf.loc[self._gdf[self._column].notna(), self._column])
-            ]
+            num = max(self._gdf.loc[self._gdf[self._column].notna(), self._column])
+            # if isinstance(num, float):
+            #     num += (
+            #         float(f"1e-{abs(self.legend.rounding)}")
+            #         if self.legend and self.legend.rounding
+            #         else 0
+            #     )
+            bins = bins + [num]
+        def adjust_bin(num: int | float, i: int) -> int | float:
+            if isinstance(num, int):
+                return num
+            adjuster = (
+                float(f"1e-{abs(self.legend.rounding)}")
+                if self.legend and self.legend.rounding
+                else 0
+            )
+            if i == 0:
+                return num - adjuster
+            elif i == len(bins) - 1:
+                return num + adjuster
+            return num
+        bins = [adjust_bin(x, i) for i, x in enumerate(bins)]
         return bins
@@ -347,16 +376,26 @@ class Map:
     ) -> tuple[tuple[GeoDataFrame], str]:
         """Separate GeoDataFrames from string (column argument)."""
-        def as_dict(obj):
+        def as_dict(obj) -> dict:
             if hasattr(obj, "__dict__"):
                 return obj.__dict__
             elif isinstance(obj, dict):
                 return obj
-            raise TypeError
-        allowed_types = (GeoDataFrame, GeoSeries, Geometry, RasterDataset)
+            raise TypeError(type(obj))
+        allowed_types = (
+            GeoDataFrame,
+            GeoSeries,
+            Geometry,
+            RasterDataset,
+            ImageCollection,
+            Image,
+            Band,
+        )
-        gdfs: tuple[GeoDataFrame | GeoSeries | Geometry | RasterDataset] = ()
+        gdfs = ()
+        more_gdfs = {}
+        i = 0
         for arg in args:
             if isinstance(arg, str):
                 if column is None:
@@ -367,12 +406,31 @@ class Map:
                     )
             elif isinstance(arg, allowed_types):
                 gdfs = gdfs + (arg,)
+            # elif isinstance(arg, Sequence) and not isinstance(arg, str):
             elif isinstance(arg, dict) or hasattr(arg, "__dict__"):
                 # add dicts or classes with GeoDataFrames to kwargs
-                more_gdfs = {}
                 for key, value in as_dict(arg).items():
                     if isinstance(value, allowed_types):
                         more_gdfs[key] = value
+                    elif isinstance(value, dict) or hasattr(value, "__dict__"):
+                        # elif isinstance(value, Sequence) and not isinstance(value, str):
+                        try:
+                            # same as above, one level down
+                            more_gdfs |= {
+                                k: v
+                                for k, v in as_dict(value).items()
+                                if isinstance(v, allowed_types)
+                            }
+                        except Exception:
+                            # ignore all exceptions
+                            pass
+            elif isinstance(arg, Sequence) and not isinstance(arg, str):
+                # add dicts or classes with GeoDataFrames to kwargs
+                for value in arg:
+                    if isinstance(value, allowed_types):
+                        name = _determine_best_name(value, column, i)
+                        more_gdfs[name] = value
                     elif isinstance(value, dict) or hasattr(value, "__dict__"):
                         try:
                             # same as above, one level down
@@ -384,8 +442,15 @@ class Map:
                         except Exception:
                             # no need to raise here
                             pass
+                    elif isinstance(value, Sequence) and not isinstance(value, str):
+                        for x in value:
+                            if not isinstance(x, allowed_types):
+                                continue
+                            name = _determine_best_name(value, column, i)
+                            more_gdfs[name] = x
+                    i += 1
-                kwargs |= more_gdfs
+        kwargs |= more_gdfs
         return gdfs, column, kwargs
@@ -394,7 +459,7 @@ class Map:
         if self.scheme is None:
             return
-        if not self.bins:
+        if self.bins is None:
             self.bins = self._create_bins(self._gdf, self._column)
             if len(self.bins) <= self._k and len(self.bins) != len(self._unique_values):
                 self._k = len(self.bins)
@@ -406,17 +471,6 @@ class Map:
             self._unique_values = self.nan_label
             self._k = 1
-    def _get_labels(self, gdfs: tuple[GeoDataFrame]) -> None:
-        """Putting the labels/names in a list before copying the gdfs."""
-        self.labels: list[str] = []
-        for i, gdf in enumerate(gdfs):
-            if hasattr(gdf, "name") and isinstance(gdf.name, str):
-                name = gdf.name
-            else:
-                name = get_object_name(gdf)
-                name = name or str(i)
-            self.labels.append(name)
     def _set_labels(self) -> None:
         """Setting the labels after copying the gdfs."""
         gdfs = []
@@ -467,10 +521,21 @@ class Map:
     def _check_if_categorical(self) -> bool:
         """Quite messy this..."""
-        if not self._column:
+        if not self._column or not self._gdfs:
             return True
+        def is_maybe_km2():
+            if "area" in self._column and (
+                "km2" in self._column
+                or "kilomet" in self._column
+                and ("sq" in self._column or "2" in self._column)
+            ):
+                return True
+            else:
+                return False
         maybe_area = 1 if "area" in self._column else 0
+        maybe_area_km2 = 1 if is_maybe_km2() else 0
         maybe_length = (
             1 if any(x in self._column for x in ["meter", "metre", "leng"]) else 0
         )
@@ -479,7 +544,10 @@ class Map:
         col_not_present = 0
         for gdf in self._gdfs:
             if self._column not in gdf:
-                if maybe_area:
+                if maybe_area_km2 and unit_is_meters(gdf):
+                    gdf["area_km2"] = gdf.area / 1_000_000
+                    maybe_area_km2 += 1
+                elif maybe_area:
                     gdf["area"] = gdf.area
                     maybe_area += 1
                 elif maybe_length:
@@ -492,6 +560,9 @@ class Map:
                     all_nan += 1
                 return True
+        if maybe_area_km2 > 1:
+            self._column = "area_km2"
+            return False
         if maybe_area > 1:
             self._column = "area"
             return False
@@ -500,14 +571,16 @@ class Map:
             return False
         if all_nan == len(self._gdfs):
-            raise ValueError(f"All values are NaN in column {self.column!r}.")
+            raise ValueError(
+                f"All values are NaN in column {self.column!r}. {self._gdfs}"
+            )
         if col_not_present == len(self._gdfs):
             raise ValueError(f"{self.column} not found.")
         return False
-    def _get_categorical_colors(self) -> None:
+    def _make_categories_colors_dict(self) -> None:
         # custom categorical cmap
         if not self._cmap and len(self._unique_values) <= len(_CATEGORICAL_CMAP):
             self._categories_colors_dict = {
@@ -529,6 +602,7 @@ class Map:
                 for i, category in enumerate(self._unique_values)
             }
+    def _fix_nans(self) -> None:
         if any(self._nan_idx):
             self._gdf[self._column] = self._gdf[self._column].fillna(self.nan_label)
             self._categories_colors_dict[self.nan_label] = self.nan_color
@@ -549,7 +623,7 @@ class Map:
         If 'scheme' is not specified, the jenks_breaks function is used, which is
         much faster than the one from Mapclassifier.
         """
-        if not len(gdf.loc[~self._nan_idx, column]):
+        if not len(gdf.loc[list(~self._nan_idx), column]):
             return np.array([0])
         n_classes = (
@@ -565,29 +639,26 @@ class Map:
             n_classes = len(self._unique_values)
         if self.scheme == "jenks":
-            try:
-                bins = jenks_breaks(
-                    gdf.loc[~self._nan_idx, column], n_classes=n_classes
-                )
-                bins = self._add_minmax_to_bins(bins)
-            except Exception:
-                pass
+            bins = jenks_breaks(
+                gdf.loc[list(~self._nan_idx), column], n_classes=n_classes
+            )
         else:
             binning = classify(
-                np.asarray(gdf.loc[~self._nan_idx, column]),
+                np.asarray(gdf.loc[list(~self._nan_idx), column]),
                 scheme=self.scheme,
-                k=self._k,
+                # k=self._k,
+                k=n_classes,
             )
             bins = binning.bins
-            bins = self._add_minmax_to_bins(bins)
+        bins = self._add_minmax_to_bins(bins)
         unique_bins = list({round(bin_, 5) for bin_ in bins})
         unique_bins.sort()
-        if self._k == len(self._unique_values) - 1:
-            return np.array(unique_bins)
-        if len(unique_bins) == len(self._unique_values):
+        if self._k == len(self._unique_values) - 1 or len(unique_bins) == len(
+            self._unique_values
+        ):
             return np.array(unique_bins)
         if len(unique_bins) == len(bins) - 1:
@@ -624,6 +695,8 @@ class Map:
     def _classify_from_bins(self, gdf: GeoDataFrame, bins: np.ndarray) -> np.ndarray:
         """Place the column values into groups."""
+        bins = bins.copy()
         # if equal lenght, convert to integer and check for equality
         if len(bins) == len(self._unique_values):
             if gdf[self._column].isna().all():
@@ -638,6 +711,14 @@ class Map:
             if len(bins) == self._k + 1:
                 bins = bins[1:]
+            if (
+                self.legend
+                and self.legend.rounding
+                and (self.legend.rounding or 1) <= 0
+            ):
+                bins[0] = bins[0] - 1
+                bins[-1] = bins[-1] + 1
             if gdf[self._column].isna().all():
                 return np.repeat(len(bins), len(gdf))
@@ -686,7 +767,8 @@ class Map:
     @cmap.setter
     def cmap(self, new_value: str) -> None:
         self._cmap = new_value
-        self.change_cmap(cmap=new_value, start=self.cmap_start, stop=self.cmap_stop)
+        if not self._is_categorical:
+            self.change_cmap(cmap=new_value, start=self.cmap_start, stop=self.cmap_stop)
     @property
     def gdf(self) -> GeoDataFrame:
@@ -738,3 +820,24 @@ class Map:
             return self[key]
         except (KeyError, ValueError, IndexError, AttributeError):
             return default
+def _determine_best_name(obj: Any, column: str | None, i: int) -> str:
+    try:
+        # Frame 3: actual object name Frame 2: maps.py:explore(). Frame 1: __init__. Frame 0: this function.
+        return str(get_object_name(obj, start=3))
+    except ValueError:
+        if isinstance(obj, GeoSeries) and obj.name:
+            return str(obj.name)
+        elif isinstance(obj, GeoDataFrame) and len(obj.columns) == 2 and not column:
+            series = obj.drop(columns=obj._geometry_column_name).iloc[:, 0]
+            if (
+                len(series.unique()) == 1
+                and mean(isinstance(x, str) for x in series) > 0.5
+            ):
+                return str(next(iter(series)))
+            elif series.name:
+                return str(series.name)
+        else:
+            # generic label e.g. Image(1)
+            return f"{obj.__class__.__name__}({i})"

ssb-sgis 1.0.2__py3-none-any.whl → 1.0.4__py3-none-any.whl

ssb-sgis 1.0.2__py3-none-any.whl → 1.0.4__py3-none-any.whl