PyPI - ssb-sgis - Versions diffs - 1.0.2__py3-none-any.whl → 1.0.4__py3-none-any.whl - Mend

ssb-sgis 1.0.2__py3-none-any.whl → 1.0.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (50) hide show

sgis/__init__.py +20 -9
sgis/debug_config.py +24 -0
sgis/exceptions.py +2 -2
sgis/geopandas_tools/bounds.py +33 -36
sgis/geopandas_tools/buffer_dissolve_explode.py +136 -35
sgis/geopandas_tools/centerlines.py +4 -91
sgis/geopandas_tools/cleaning.py +1576 -583
sgis/geopandas_tools/conversion.py +38 -19
sgis/geopandas_tools/duplicates.py +29 -8
sgis/geopandas_tools/general.py +263 -100
sgis/geopandas_tools/geometry_types.py +4 -4
sgis/geopandas_tools/neighbors.py +19 -15
sgis/geopandas_tools/overlay.py +2 -2
sgis/geopandas_tools/point_operations.py +5 -5
sgis/geopandas_tools/polygon_operations.py +510 -105
sgis/geopandas_tools/polygons_as_rings.py +40 -8
sgis/geopandas_tools/sfilter.py +29 -12
sgis/helpers.py +3 -3
sgis/io/dapla_functions.py +238 -19
sgis/io/read_parquet.py +1 -1
sgis/maps/examine.py +27 -12
sgis/maps/explore.py +450 -65
sgis/maps/legend.py +177 -76
sgis/maps/map.py +206 -103
sgis/maps/maps.py +178 -105
sgis/maps/thematicmap.py +243 -83
sgis/networkanalysis/_service_area.py +6 -1
sgis/networkanalysis/closing_network_holes.py +2 -2
sgis/networkanalysis/cutting_lines.py +15 -8
sgis/networkanalysis/directednetwork.py +1 -1
sgis/networkanalysis/finding_isolated_networks.py +15 -8
sgis/networkanalysis/networkanalysis.py +17 -19
sgis/networkanalysis/networkanalysisrules.py +1 -1
sgis/networkanalysis/traveling_salesman.py +1 -1
sgis/parallel/parallel.py +64 -27
sgis/raster/__init__.py +0 -6
sgis/raster/base.py +208 -0
sgis/raster/cube.py +54 -8
sgis/raster/image_collection.py +3257 -0
sgis/raster/indices.py +17 -5
sgis/raster/raster.py +138 -243
sgis/raster/sentinel_config.py +120 -0
sgis/raster/zonal.py +0 -1
{ssb_sgis-1.0.2.dist-info → ssb_sgis-1.0.4.dist-info}/METADATA +6 -7
ssb_sgis-1.0.4.dist-info/RECORD +62 -0
sgis/raster/methods_as_functions.py +0 -0
sgis/raster/torchgeo.py +0 -171
ssb_sgis-1.0.2.dist-info/RECORD +0 -61
{ssb_sgis-1.0.2.dist-info → ssb_sgis-1.0.4.dist-info}/LICENSE +0 -0
{ssb_sgis-1.0.2.dist-info → ssb_sgis-1.0.4.dist-info}/WHEEL +0 -0

sgis/maps/thematicmap.py CHANGED Viewed

@@ -10,8 +10,10 @@ import numpy as np
 import pandas as pd
 from geopandas import GeoDataFrame
+from .legend import LEGEND_KWARGS
 from .legend import ContinousLegend
 from .legend import Legend
+from .legend import prettify_bins
 from .map import Map
 # the geopandas._explore raises a deprication warning. Ignoring for now.
@@ -20,60 +22,132 @@ warnings.filterwarnings(
 )
 pd.options.mode.chained_assignment = None
+MAP_KWARGS = {
+    "bins",
+    "title",
+    "title_fontsize",
+    "size",
+    "cmap",
+    "cmap_start",
+    "cmap_stop",
+    "scheme",
+    "k",
+    "column",
+    "title_color",
+    "facecolor",
+    "labelcolor",
+    "nan_color",
+    "title_kwargs",
+    "bg_gdf_color",
+    "title_position",
+}
 class ThematicMap(Map):
-    """Class for creating static maps with geopandas and matplotlib.
-    The class takes one or more GeoDataFrames and a column name. The class attributes
-    can then be set to customise the map before plotting.
-    Attributes:
-        size (int): Width and height of the plot in inches.
-        k (int): Number of color groups.
-        legend (Legend): The legend object of the map. The legend holds its own set of
-            attributes. See the Legend class for details.
-        title (str): Title of the plot.
-        title_color (str): Color of the title font.
-        title_fontsize (int): Color of the title font.
-        bins (list[int | float]): For numeric columns. List of numbers that define the
-            maximum value for the color groups.
-        cmap (str): Colormap of the plot. See:
+    """Class for making static maps.
+    Args:
+        *gdfs: One or more GeoDataFrames.
+        column: The name of the column to plot.
+        title: Title of the plot.
+        title_position: Title position. Either "center" (default), "left" or "right".
+        size: Width and height of the plot in inches. Fontsize of title and legend is
+            adjusted accordingly. Defaults to 25.
+        dark: If False (default), the background will be white and the text black. If
+            True, the background will be black and the text white. When True, the
+            default cmap is "viridis", and when False, the default is red to purple
+            (RdPu).
+        cmap: Colormap of the plot. See:
             https://matplotlib.org/stable/tutorials/colors/colormaps.html
-        cmap_start (int): Start position for the color palette.
-        cmap_stop (int): End position for the color palette.
-        facecolor (str): Background color.
+        scheme: How to devide numeric values into categories. Defaults to
+            "naturalbreaks".
+        k: Number of color groups.
+        bins: For numeric columns. List of numbers that define the
+            maximum value for the color groups.
+        nan_label: Label for missing data.
+        legend_kwargs: dictionary with attributes for the legend. E.g.:
+            title: Legend title. Defaults to the column name.
+            rounding: If positive number, it will round floats to n decimals.
+            If negative, eg. -2, the number 3429 is rounded to 3400.
+            By default, the rounding depends on the column's maximum value
+            and standard deviation.
+            position: The legend's x and y position in the plot. By default, it's
+            decided dynamically by finding the space with most distance to
+            the geometries. To be specified as a tuple of
+            x and y position between 0 and 1. E.g. position=(0.8, 0.2) for a position
+            in the bottom right corner, (0.2, 0.8) for the upper left corner.
+            pretty_labels: Whether to capitalize words in text categories.
+            label_suffix: For numeric columns. The text to put after each number
+            in the legend labels. Defaults to None.
+            label_sep: For numeric columns. Text to put in between the two numbers
+            in each color group in the legend. Defaults to '-'.
+            thousand_sep: For numeric columns. Separator between each thousand for
+            large numbers. Defaults to None, meaning no separator.
+            decimal_mark: For numeric columns. Text to use as decimal point.
+            Defaults to None, meaning '.' (dot) unless 'thousand_sep' is
+            '.'. In this case, ',' (comma) will be used as decimal mark.
+        **kwargs: Additional attributes for the map. E.g.:
+            title_color (str): Color of the title font.
+            title_fontsize (int): Color of the title font.
+            cmap_start (int): Start position for the color palette.
+            cmap_stop (int): End position for the color palette.
+            facecolor (str): Background color.
+            labelcolor (str): Color for the labels.
+            nan_color: Color for missing data.
     Examples:
-    --------
+    ---------
     >>> import sgis as sg
-    >>> points = sg.random_points(100).pipe(sg.buff, np.random.rand(100))
-    >>> points2 = sg.random_points(100).pipe(sg.buff, np.random.rand(100))
+    >>> points = sg.random_points(100, loc=1000).pipe(sg.buff, np.random.rand(100) * 100)
+    >>> points2 = sg.random_points(100, loc=1000).pipe(sg.buff, np.random.rand(100) * 100)
     Simple plot with legend and title.
-    >>> m = sg.ThematicMap(points, points2, "area")
-    >>> m.title = "Area of random circles"
+    >>> m = sg.ThematicMap(points, points2, column="area", title="Area of random circles")
     >>> m.plot()
-    Plot with custom legend units (label_suffix) and separator (label_sep).
-    >>> m = sg.ThematicMap(points, points2, "area")
-    >>> m.title = "Area of random circles"
-    >>> m.legend.label_suffix = "m2"
-    >>> m.legend.label_sep = "to"
+    Plot with custom legend units (label_suffix) and thousand separator.
+    And with rounding set to -2, meaning e.g. 3429 is rounded to 3400.
+    If rounding was set to positive 2, 3429 would be rounded to 3429.00.
+    >>> m = sg.ThematicMap(
+    ...     points,
+    ...     points2,
+    ...     column="area",
+    ...     title = "Area of random circles",
+    ...     legend_kwargs=dict(
+    ...         rounding=-2,
+    ...         thousand_sep=" ",
+    ...         label_sep="to",
+    ...     ),
+    ... )
     >>> m.plot()
-    With custom bins and legend labels.
-    >>> m = sg.ThematicMap(points, points2, "area")
-    >>> m.title = "Area of random circles"
-    >>> m.bins = [1, 2, 3]
-    >>> m.legend.labels = [
-    ...     f"{int(round(min(points.length),0))} to 1",
-    ...     "1 to 2",
-    ...     "2 to 3",
-    ...     f"3 to {int(round(max(points.length),0))}",
-    ... ]
+    With custom bins for the categories, and other customizations.
+    >>> m = sg.ThematicMap(
+    ...     points,
+    ...     points2,
+    ...     column="area",
+    ...     cmap="Greens",
+    ...     cmap_start=50,
+    ...     cmap_stop=255,
+    ...     nan_label="Missing",
+    ...     title = "Area of random circles",
+    ...     bins = [5000, 10000, 15000, 20000],
+    ...     title_kwargs=dict(
+    ...         loc="left",
+    ...         y=0.93,
+    ...         x=0.025,
+    ...     ),
+    ...     legend_kwargs=dict(
+    ...         thousand_sep=" ",
+    ...         label_sep="to",
+    ...         decimal_mark=".",
+    ...         label_suffix="m2",
+    ...     ),
+    ... )
     >>> m.plot()
     """
@@ -81,37 +155,105 @@ class ThematicMap(Map):
         self,
         *gdfs: GeoDataFrame,
         column: str | None = None,
+        title: str | None = None,
+        title_position: tuple[float, float] | None = None,
         size: int = 25,
-        black: bool = False,
+        dark: bool = False,
+        cmap: str | None = None,
+        scheme: str = "naturalbreaks",
+        k: int = 5,
+        bins: tuple[float] | None = None,
+        nan_label: str = "Missing",
+        legend_kwargs: dict | None = None,
+        title_kwargs: dict | None = None,
+        legend: bool = False,
+        **kwargs,
     ) -> None:
-        """Initialiser.
-        Args:
-            *gdfs: One or more GeoDataFrames.
-            column: The name of the column to plot.
-            size: Width and height of the plot in inches. Fontsize of title and legend is
-                adjusted accordingly. Defaults to 25.
-            black: If False (default), the background will be white and the text black. If
-                True, the background will be black and the text white. When True, the
-                default cmap is "viridis", and when False, the default is red to purple
-                (RdPu).
+        """Initialiser."""
+        super().__init__(
+            *gdfs,
+            column=column,
+            scheme=scheme,
+            k=k,
+            bins=bins,
+            nan_label=nan_label,
+        )
-        """
-        super().__init__(*gdfs, column=column)
+        if not legend:
+            self.legend = None
+        self.title = title
         self._size = size
-        self._black = black
+        self._dark = dark
+        self.title_kwargs = title_kwargs or {}
+        if title_position and "position" in self.title_kwargs:
+            raise TypeError(
+                "Specify either 'title_position' or title_kwargs position, not both."
+            )
+        if title_position or "position" in self.title_kwargs:
+            position = self.title_kwargs.pop("position", title_position)
+            error_mess = (
+                "legend_kwargs position should be a two length tuple/list with two numbers between "
+                "0 and 1 (x, y position)"
+            )
+            if not hasattr(position, "__len__"):
+                raise TypeError(error_mess)
+            if len(position) != 2:
+                raise ValueError(error_mess)
+            x, y = position
+            if "loc" not in self.title_kwargs:
+                if x < 0.4:
+                    self.title_kwargs["loc"] = "left"
+                elif x > 0.6:
+                    self.title_kwargs["loc"] = "right"
+                else:
+                    self.title_kwargs["loc"] = "center"
+            self.title_kwargs["x"], self.title_kwargs["y"] = x, y
         self.background_gdfs = []
-        self._title_fontsize = self._size * 2
+        legend_kwargs = legend_kwargs or {}
-        self.black = black
+        self._title_fontsize = self._size * 1.9
-        if not self._is_categorical:
+        black = kwargs.pop("black", None)
+        self._dark = self._dark or black
+        if not self.cmap and not self._is_categorical:
             self._choose_cmap()
+        self._dark_or_light()
         self._create_legend()
+        if cmap:
+            self._cmap = cmap
+        for key, value in kwargs.items():
+            if key not in MAP_KWARGS:
+                raise TypeError(
+                    f"{self.__class__.__name__} got an unexpected keyword argument {key}"
+                )
+            try:
+                setattr(self, key, value)
+            except Exception:
+                setattr(self, f"_{key}", value)
+        for key, value in legend_kwargs.items():
+            if key not in LEGEND_KWARGS:
+                raise TypeError(
+                    f"{self.__class__.__name__} legend_kwargs got an unexpected key {key}"
+                )
+            if self.legend is not None:
+                try:
+                    setattr(self.legend, key, value)
+                except Exception:
+                    setattr(self.legend, f"_{key}", value)
+    @property
+    def valid_keywords(self) -> set[str]:
+        """List all valid keywords for the class initialiser."""
+        return MAP_KWARGS
     def change_cmap(self, cmap: str, start: int = 0, stop: int = 256) -> "ThematicMap":
         """Change the color palette of the plot.
@@ -177,7 +319,7 @@ class ThematicMap(Map):
         else:
             kwargs = self._prepare_continous_plot(kwargs)
             if self.legend:
-                if not self.legend._rounding_has_been_set:
+                if not self.legend.rounding:
                     self.legend._rounding = self.legend._get_rounding(
                         array=self._gdf.loc[~self._nan_idx, self._column]
                     )
@@ -194,15 +336,15 @@ class ThematicMap(Map):
                 self._gdf, k=self._k + bool(len(self._nan_idx))
             )
-        if __test:
-            return
         self._prepare_plot(**kwargs)
         if self.legend:
             self.ax = self.legend._actually_add_legend(ax=self.ax)
-        self._gdf.plot(legend=include_legend, ax=self.ax, **kwargs)
+        self.ax = self._gdf.plot(legend=include_legend, ax=self.ax, **kwargs)
+        if __test:
+            return self
     def save(self, path: str) -> None:
         """Save figure as image file.
@@ -238,9 +380,13 @@ class ThematicMap(Map):
         if hasattr(self, "_background_gdfs"):
             self._actually_add_background()
-        if hasattr(self, "title") and self.title:
+        if self.title:
             self.ax.set_title(
-                self.title, fontsize=self.title_fontsize, color=self.title_color
+                self.title,
+                **(
+                    dict(fontsize=self.title_fontsize, color=self.title_color)
+                    | self.title_kwargs
+                ),
             )
     def _prepare_continous_plot(self, kwargs: dict) -> dict:
@@ -257,6 +403,13 @@ class ThematicMap(Map):
             return kwargs
         else:
+            if self.legend and self.legend.rounding and self.legend.rounding < 0:
+                self.bins = prettify_bins(self.bins, self.legend.rounding)
+                self.bins = list({round(bin_, 5) for bin_ in self.bins})
+                self.bins.sort()
+                # self.legend._rounding_was = self.legend.rounding
+                # self.legend.rounding = None
             classified = self._classify_from_bins(self._gdf, bins=self.bins)
             classified_sequential = self._push_classification(classified)
             n_colors = len(np.unique(classified_sequential)) - any(self._nan_idx)
@@ -264,10 +417,13 @@ class ThematicMap(Map):
             self._bins_unique_values = self._make_bin_value_dict(
                 self._gdf, classified_sequential
             )
             colorarray = self._unique_colors[classified_sequential]
             kwargs["color"] = colorarray
-        if self.legend and not self.legend._rounding_has_been_set:
+        if (
+            self.legend and self.legend.rounding
+        ):  # not self.legend._rounding_has_been_set:
             self.bins = self.legend._set_rounding(
                 bins=self.bins, rounding=self.legend._rounding
             )
@@ -279,10 +435,13 @@ class ThematicMap(Map):
     def _prepare_categorical_plot(self, kwargs: dict) -> dict:
         """Map values to colors."""
-        self._get_categorical_colors()
-        colorarray = self._gdf["color"]
+        self._make_categories_colors_dict()
+        if self._gdf is not None and len(self._gdf):
+            self._fix_nans()
-        kwargs["color"] = colorarray
+        if self._gdf is not None:
+            colorarray = self._gdf["color"]
+            kwargs["color"] = colorarray
         return kwargs
     def _actually_add_legend(self) -> None:
@@ -309,8 +468,10 @@ class ThematicMap(Map):
     def _create_legend(self) -> None:
         """Instantiate the Legend class."""
+        if self.legend is None:
+            return
         kwargs = {}
-        if self._black:
+        if self._dark:
             kwargs["facecolor"] = "#0f0f0f"
             kwargs["labelcolor"] = "#fefefe"
             kwargs["title_color"] = "#fefefe"
@@ -322,7 +483,7 @@ class ThematicMap(Map):
     def _choose_cmap(self) -> None:
         """Kwargs is to catch start and stop points for the cmap in __init__."""
-        if self._black:
+        if self._dark:
             self._cmap = "viridis"
             self.cmap_start = 0
             self.cmap_stop = 256
@@ -352,8 +513,8 @@ class ThematicMap(Map):
         ax = fig.add_subplot(1, 1, 1)
         return fig, ax
-    def _black_or_white(self) -> None:
-        if self._black:
+    def _dark_or_light(self) -> None:
+        if self._dark:
             self.facecolor, self.title_color, self.bg_gdf_color = (
                 "#0f0f0f",
                 "#fefefe",
@@ -367,23 +528,22 @@ class ThematicMap(Map):
             self.facecolor, self.title_color, self.bg_gdf_color = (
                 "#fefefe",
                 "#0f0f0f",
-                "#ebebeb",
+                "#dbdbdb",
             )
             self.nan_color = "#c2c2c2"
             if not self._is_categorical:
                 self.change_cmap("RdPu", start=23)
-        self._create_legend()
     @property
-    def black(self) -> bool:
+    def dark(self) -> bool:
         """Whether to use dark background and light text colors."""
-        return self._black
+        return self._dark
-    @black.setter
-    def black(self, new_value: bool):
-        self._black = new_value
-        self._black_or_white()
+    @dark.setter
+    def dark(self, new_value: bool):
+        self._dark = new_value
+        self._dark_or_light()
+        self._create_legend()
     @property
     def title_fontsize(self) -> int:

sgis/networkanalysis/_service_area.py CHANGED Viewed

@@ -5,6 +5,7 @@ from igraph import Graph
 from shapely import force_2d
 from shapely import reverse
 from shapely import unary_union
+from shapely import union_all
 from shapely.geometry import MultiPoint
 from shapely.geometry import Point
 from shapely.ops import nearest_points
@@ -113,7 +114,11 @@ def _service_area(
                 else:
                     snapped_origin: Point = nearest_points(
                         nodes_union,
-                        origins.loc[origins["temp_idx"] == idx, "geometry"].unary_union,
+                        union_all(
+                            origins.loc[
+                                origins["temp_idx"] == idx, "geometry"
+                            ].geometry.values
+                        ),
                     )[0]
                     within = sfilter(within, snapped_origin.buffer(0.01))

sgis/networkanalysis/closing_network_holes.py CHANGED Viewed

@@ -44,7 +44,7 @@ def close_network_holes(
         NetworkAnalysis. These values must be filled before analysis.
     Examples:
-    --------
+    ---------
     Read road data with small gaps.
     >>> import sgis as sg
@@ -157,7 +157,7 @@ def close_network_holes_to_deadends(
         The input GeoDataFrame with new lines added.
     Examples:
-    --------
+    ---------
     Read road data with small gaps.
     >>> import sgis as sg

sgis/networkanalysis/cutting_lines.py CHANGED Viewed

@@ -52,7 +52,7 @@ def split_lines_by_nearest_point(
         ValueError: If the crs of the input data differs.
     Examples:
-    --------
+    ---------
     >>> from sgis import read_parquet_url, split_lines_by_nearest_point
     >>> roads = read_parquet_url("https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/roads_oslo_2022.parquet")
     >>> points = read_parquet_url("https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/points_oslo.parquet")
@@ -77,7 +77,7 @@ def split_lines_by_nearest_point(
     """
     PRECISION = 1e-6
-    if not len(gdf):
+    if not len(gdf) or not len(points):
         return gdf
     if (points.crs is not None and gdf.crs is not None) and not points.crs.equals(
@@ -86,10 +86,14 @@ def split_lines_by_nearest_point(
         raise ValueError("crs mismatch:", points.crs, "and", gdf.crs)
     if get_geom_type(gdf) != "line":
-        raise ValueError("'gdf' should only have line geometries.", gdf.geom_type)
+        raise ValueError(
+            f"'gdf' should only have line geometriess. Got {gdf.geom_type.value_counts()}"
+        )
     if get_geom_type(points) != "point":
-        raise ValueError("'points' should only have point geometries.")
+        raise ValueError(
+            f"'points' should only have point geometries. Got {points.geom_type.value_counts()}"
+        )
     gdf = gdf.copy()
@@ -230,9 +234,12 @@ def _change_line_endpoint(
         .values
     )
-    relevant_lines_mapped = relevant_lines.groupby(level=0)["geometry"].agg(LineString)
+    is_line = relevant_lines.groupby(level=0).size() > 1
+    relevant_lines_mapped = (
+        relevant_lines.loc[is_line].groupby(level=0)["geometry"].agg(LineString)
+    )
-    gdf.loc[is_relevant, "geometry"] = relevant_lines_mapped
+    gdf.loc[relevant_lines_mapped.index, "geometry"] = relevant_lines_mapped
     return gdf
@@ -255,7 +262,7 @@ def cut_lines(
         This method is time consuming for large networks and low 'max_length'.
     Examples:
-    --------
+    ---------
     >>> from sgis import read_parquet_url, cut_lines
     >>> roads = read_parquet_url("https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/roads_oslo_2022.parquet")
     >>> roads.length.describe().round(1)
@@ -327,7 +334,7 @@ def cut_lines_once(
             Defaults to False.
     Examples:
-    --------
+    ---------
     >>> from sgis import cut_lines_once, to_gdf
     >>> import pandas as pd
     >>> from shapely.geometry import LineString

sgis/networkanalysis/directednetwork.py CHANGED Viewed

@@ -29,7 +29,7 @@ def make_directed_network_norway(gdf: GeoDataFrame, dropnegative: bool) -> GeoDa
             to keep them.
     Examples:
-    --------
+    ---------
     2022 data for the municipalities of Oslo and Eidskog can be read directly like this:
     >>> import sgis as sg

sgis/networkanalysis/finding_isolated_networks.py CHANGED Viewed

@@ -1,6 +1,7 @@
 """Functions for Finding network components in a GeoDataFrame of lines."""
 import networkx as nx
+import pandas as pd
 from geopandas import GeoDataFrame
 from .nodes import make_node_ids
@@ -23,7 +24,7 @@ def get_connected_components(gdf: GeoDataFrame) -> GeoDataFrame:
         The GeoDataFrame with a new column "connected".
     Examples:
-    --------
+    ---------
     >>> from sgis import read_parquet_url, get_connected_components
     >>> roads = read_parquet_url("https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/roads_oslo_2022.parquet")
@@ -76,12 +77,12 @@ def get_component_size(gdf: GeoDataFrame) -> GeoDataFrame:
         A GeoDataFrame with a new column "component_size".
     Examples:
-    --------
+    ---------
     >>> from sgis import read_parquet_url, get_component_size
     >>> roads = read_parquet_url("https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/roads_oslo_2022.parquet")
     >>> roads = get_component_size(roads)
-    >>> roads.component_size.value_counts().head()
+    >>> roads["component_size"].value_counts().head()
     component_size
     79180    85638
     2         1601
@@ -101,11 +102,17 @@ def get_component_size(gdf: GeoDataFrame) -> GeoDataFrame:
     graph.add_edges_from(edges)
     components = [list(x) for x in nx.connected_components(graph)]
-    componentsdict = {
-        idx: len(component) for component in components for idx in component
-    }
-    gdf["component_size"] = gdf.source.map(componentsdict)
+    mapper = pd.DataFrame(
+        {
+            idx: [i, len(component)]
+            for i, component in enumerate(components)
+            for idx in component
+        },
+    ).transpose()
+    mapper.columns = ["component_index", "component_size"]
+    gdf["component_index"] = gdf["source"].map(mapper["component_index"])
+    gdf["component_size"] = gdf["source"].map(mapper["component_size"])
     gdf = gdf.drop(
         ["source_wkt", "target_wkt", "source", "target", "n_source", "n_target"], axis=1

ssb-sgis 1.0.2__py3-none-any.whl → 1.0.4__py3-none-any.whl

ssb-sgis 1.0.2__py3-none-any.whl → 1.0.4__py3-none-any.whl