ssb-sgis 1.0.2__py3-none-any.whl → 1.0.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (50)
  1. sgis/__init__.py +20 -9
  2. sgis/debug_config.py +24 -0
  3. sgis/exceptions.py +2 -2
  4. sgis/geopandas_tools/bounds.py +33 -36
  5. sgis/geopandas_tools/buffer_dissolve_explode.py +136 -35
  6. sgis/geopandas_tools/centerlines.py +4 -91
  7. sgis/geopandas_tools/cleaning.py +1576 -583
  8. sgis/geopandas_tools/conversion.py +38 -19
  9. sgis/geopandas_tools/duplicates.py +29 -8
  10. sgis/geopandas_tools/general.py +263 -100
  11. sgis/geopandas_tools/geometry_types.py +4 -4
  12. sgis/geopandas_tools/neighbors.py +19 -15
  13. sgis/geopandas_tools/overlay.py +2 -2
  14. sgis/geopandas_tools/point_operations.py +5 -5
  15. sgis/geopandas_tools/polygon_operations.py +510 -105
  16. sgis/geopandas_tools/polygons_as_rings.py +40 -8
  17. sgis/geopandas_tools/sfilter.py +29 -12
  18. sgis/helpers.py +3 -3
  19. sgis/io/dapla_functions.py +238 -19
  20. sgis/io/read_parquet.py +1 -1
  21. sgis/maps/examine.py +27 -12
  22. sgis/maps/explore.py +450 -65
  23. sgis/maps/legend.py +177 -76
  24. sgis/maps/map.py +206 -103
  25. sgis/maps/maps.py +178 -105
  26. sgis/maps/thematicmap.py +243 -83
  27. sgis/networkanalysis/_service_area.py +6 -1
  28. sgis/networkanalysis/closing_network_holes.py +2 -2
  29. sgis/networkanalysis/cutting_lines.py +15 -8
  30. sgis/networkanalysis/directednetwork.py +1 -1
  31. sgis/networkanalysis/finding_isolated_networks.py +15 -8
  32. sgis/networkanalysis/networkanalysis.py +17 -19
  33. sgis/networkanalysis/networkanalysisrules.py +1 -1
  34. sgis/networkanalysis/traveling_salesman.py +1 -1
  35. sgis/parallel/parallel.py +64 -27
  36. sgis/raster/__init__.py +0 -6
  37. sgis/raster/base.py +208 -0
  38. sgis/raster/cube.py +54 -8
  39. sgis/raster/image_collection.py +3257 -0
  40. sgis/raster/indices.py +17 -5
  41. sgis/raster/raster.py +138 -243
  42. sgis/raster/sentinel_config.py +120 -0
  43. sgis/raster/zonal.py +0 -1
  44. {ssb_sgis-1.0.2.dist-info → ssb_sgis-1.0.4.dist-info}/METADATA +6 -7
  45. ssb_sgis-1.0.4.dist-info/RECORD +62 -0
  46. sgis/raster/methods_as_functions.py +0 -0
  47. sgis/raster/torchgeo.py +0 -171
  48. ssb_sgis-1.0.2.dist-info/RECORD +0 -61
  49. {ssb_sgis-1.0.2.dist-info → ssb_sgis-1.0.4.dist-info}/LICENSE +0 -0
  50. {ssb_sgis-1.0.2.dist-info → ssb_sgis-1.0.4.dist-info}/WHEEL +0 -0
@@ -90,8 +90,10 @@ def to_shapely(obj: Any) -> Geometry:
90
90
  return obj
91
91
  if not hasattr(obj, "__iter__"):
92
92
  raise TypeError(type(obj))
93
- if hasattr(obj, "unary_union"):
94
- return obj.unary_union
93
+ try:
94
+ return shapely.union_all(obj.geometry.values)
95
+ except AttributeError:
96
+ pass
95
97
  try:
96
98
  return Point(*obj)
97
99
  except TypeError:
@@ -108,6 +110,7 @@ def to_shapely(obj: Any) -> Geometry:
108
110
  return shapely.wkb.loads(obj)
109
111
  except TypeError:
110
112
  pass
113
+ raise TypeError(type(obj), obj)
111
114
 
112
115
 
113
116
  def to_bbox(
@@ -122,25 +125,41 @@ def to_bbox(
122
125
  "xmin", "ymin", "xmax", "ymax".
123
126
  """
124
127
  if isinstance(obj, (GeoDataFrame, GeoSeries)):
125
- return tuple(obj.total_bounds)
126
- if isinstance(obj, Geometry):
127
- return tuple(obj.bounds)
128
+ bounds = tuple(obj.total_bounds)
129
+ assert isinstance(bounds, tuple)
130
+ return bounds
131
+ try:
132
+ bounds = tuple(obj.bounds)
133
+ assert isinstance(bounds, tuple)
134
+ return bounds
135
+ except Exception:
136
+ pass
128
137
 
129
138
  try:
130
- minx = int(np.min(obj["minx"])) # type: ignore [index]
131
- miny = int(np.min(obj["miny"])) # type: ignore [index]
132
- maxx = int(np.max(obj["maxx"])) # type: ignore [index]
133
- maxy = int(np.max(obj["maxy"])) # type: ignore [index]
139
+ minx = float(np.min(obj["minx"])) # type: ignore [index]
140
+ miny = float(np.min(obj["miny"])) # type: ignore [index]
141
+ maxx = float(np.max(obj["maxx"])) # type: ignore [index]
142
+ maxy = float(np.max(obj["maxy"])) # type: ignore [index]
134
143
  return minx, miny, maxx, maxy
135
144
  except Exception:
136
- try:
137
- minx = int(np.min(obj.minx)) # type: ignore [union-attr]
138
- miny = int(np.min(obj.miny)) # type: ignore [union-attr]
139
- maxx = int(np.max(obj.maxx)) # type: ignore [union-attr]
140
- maxy = int(np.max(obj.maxy)) # type: ignore [union-attr]
141
- return minx, miny, maxx, maxy
142
- except Exception:
143
- pass
145
+ pass
146
+ try:
147
+ minx = float(np.min(obj.minx)) # type: ignore [union-attr]
148
+ miny = float(np.min(obj.miny)) # type: ignore [union-attr]
149
+ maxx = float(np.max(obj.maxx)) # type: ignore [union-attr]
150
+ maxy = float(np.max(obj.maxy)) # type: ignore [union-attr]
151
+ return minx, miny, maxx, maxy
152
+ except Exception:
153
+ pass
154
+
155
+ try:
156
+ minx = float(np.min(obj["west_longitude"])) # type: ignore [index]
157
+ miny = float(np.min(obj["south_latitude"])) # type: ignore [index]
158
+ maxx = float(np.max(obj["east_longitude"])) # type: ignore [index]
159
+ maxy = float(np.max(obj["north_latitude"])) # type: ignore [index]
160
+ return minx, miny, maxx, maxy
161
+ except Exception:
162
+ pass
144
163
 
145
164
  if hasattr(obj, "geometry"):
146
165
  try:
@@ -195,7 +214,7 @@ def coordinate_array(
195
214
  np.ndarray of np.ndarrays of coordinates.
196
215
 
197
216
  Examples:
198
- --------
217
+ ---------
199
218
  >>> import sgis as sg
200
219
  >>> points = sg.to_gdf(
201
220
  ... [
@@ -279,7 +298,7 @@ def to_gdf(
279
298
  A GeoDataFrame with one column, the geometry column.
280
299
 
281
300
  Examples:
282
- --------
301
+ ---------
283
302
  >>> import sgis as sg
284
303
  >>> coords = (10, 60)
285
304
  >>> sg.to_gdf(coords, crs=4326)
@@ -8,10 +8,10 @@ from shapely import STRtree
8
8
  from shapely import difference
9
9
  from shapely import make_valid
10
10
  from shapely import simplify
11
- from shapely import unary_union
12
11
  from shapely.errors import GEOSException
13
12
 
14
13
  from .general import _determine_geom_type_args
14
+ from .general import _grouped_unary_union
15
15
  from .general import _parallel_unary_union_geoseries
16
16
  from .general import _push_geom_col
17
17
  from .general import clean_geoms
@@ -54,7 +54,7 @@ def update_geometries(
54
54
  predicate: Spatial predicate for the spatial tree.
55
55
 
56
56
  Example:
57
- ------
57
+ --------
58
58
  Create two circles and get the overlap.
59
59
 
60
60
  >>> import sgis as sg
@@ -125,10 +125,8 @@ def update_geometries(
125
125
  else:
126
126
  only_one = erasers.groupby(level=0).transform("size") == 1
127
127
  one_hit = erasers[only_one]
128
- many_hits = (
129
- erasers[~only_one]
130
- .groupby(level=0)
131
- .agg(lambda x: make_valid(unary_union(x, grid_size=grid_size)))
128
+ many_hits = _grouped_unary_union(
129
+ erasers[~only_one], level=0, grid_size=grid_size
132
130
  )
133
131
  erasers = pd.concat([one_hit, many_hits]).sort_index()
134
132
 
@@ -213,7 +211,7 @@ def get_intersections(
213
211
  A GeoDataFrame of the overlapping polygons.
214
212
 
215
213
  Examples:
216
- --------
214
+ ---------
217
215
  Create three partially overlapping polygons.
218
216
 
219
217
  >>> import sgis as sg
@@ -357,10 +355,33 @@ def _get_intersecting_geometries(
357
355
 
358
356
  duplicated_points = points_joined.loc[points_joined.index.duplicated(keep=False)]
359
357
 
360
- return intersected.loc[intersected.index.isin(duplicated_points.index)].drop(
358
+ out = intersected.loc[intersected.index.isin(duplicated_points.index)].drop(
361
359
  columns=["idx_left", "idx_right"]
362
360
  )
363
361
 
362
+ # some polygons within polygons are not counted in the
363
+ within = (
364
+ gdf.assign(_range_idx_inters_left=lambda x: range(len(x)))
365
+ .sjoin(
366
+ GeoDataFrame(
367
+ {
368
+ "geometry": gdf.buffer(1e-6).values,
369
+ "_range_idx_inters_right": range(len(gdf)),
370
+ },
371
+ crs=gdf.crs,
372
+ ),
373
+ how="inner",
374
+ predicate="within",
375
+ )
376
+ .loc[lambda x: x["_range_idx_inters_left"] != x["_range_idx_inters_right"]]
377
+ .drop(
378
+ columns=["index_right", "_range_idx_inters_left", "_range_idx_inters_right"]
379
+ )
380
+ .pipe(sfilter_inverse, out.buffer(-PRECISION))
381
+ )
382
+
383
+ return pd.concat([out, within])
384
+
364
385
 
365
386
  def _drop_duplicate_geometries(gdf: GeoDataFrame, **kwargs) -> GeoDataFrame:
366
387
  """Drop geometries that are considered equal.
@@ -1,20 +1,23 @@
1
+ import functools
2
+ import itertools
1
3
  import numbers
2
4
  import warnings
3
5
  from collections.abc import Hashable
4
6
  from collections.abc import Iterable
5
7
  from typing import Any
6
8
 
7
- import dask_geopandas
8
9
  import joblib
9
10
  import numpy as np
10
11
  import pandas as pd
11
12
  import pyproj
13
+ import shapely
12
14
  from geopandas import GeoDataFrame
13
15
  from geopandas import GeoSeries
14
16
  from geopandas.array import GeometryArray
15
17
  from geopandas.array import GeometryDtype
16
18
  from numpy.typing import NDArray
17
19
  from shapely import Geometry
20
+ from shapely import extract_unique_points
18
21
  from shapely import get_coordinates
19
22
  from shapely import get_exterior_ring
20
23
  from shapely import get_interior_ring
@@ -23,10 +26,16 @@ from shapely import get_parts
23
26
  from shapely import linestrings
24
27
  from shapely import make_valid
25
28
  from shapely import points as shapely_points
26
- from shapely import unary_union
29
+ from shapely import union_all
27
30
  from shapely.geometry import LineString
31
+ from shapely.geometry import MultiPoint
28
32
  from shapely.geometry import Point
33
+ from shapely.geometry import Polygon
29
34
 
35
+ from .conversion import coordinate_array
36
+ from .conversion import to_bbox
37
+ from .conversion import to_gdf
38
+ from .conversion import to_geoseries
30
39
  from .geometry_types import get_geom_type
31
40
  from .geometry_types import make_all_singlepart
32
41
  from .geometry_types import to_single_geom_type
@@ -34,7 +43,7 @@ from .geometry_types import to_single_geom_type
34
43
 
35
44
  def split_geom_types(gdf: GeoDataFrame | GeoSeries) -> tuple[GeoDataFrame | GeoSeries]:
36
45
  return tuple(
37
- gdf.loc[gdf.geom_type == geom_type] for geom_type in gdf.geom_type.unique()
46
+ gdf[gdf.geom_type == geom_type] for geom_type in gdf.geom_type.unique()
38
47
  )
39
48
 
40
49
 
@@ -164,7 +173,7 @@ def clean_geoms(
164
173
  non-empty and not-NaN/-None geometries.
165
174
 
166
175
  Examples:
167
- --------
176
+ ---------
168
177
  >>> import sgis as sg
169
178
  >>> import pandas as pd
170
179
  >>> from shapely import wkt
@@ -281,7 +290,7 @@ def sort_large_first(gdf: GeoDataFrame | GeoSeries) -> GeoDataFrame | GeoSeries:
281
290
  A GeoDataFrame or GeoSeries sorted from large to small in area.
282
291
 
283
292
  Examples:
284
- --------
293
+ ---------
285
294
  Create GeoDataFrame with NaN values.
286
295
 
287
296
  >>> import sgis as sg
@@ -381,35 +390,27 @@ def sort_small_first(gdf: GeoDataFrame | GeoSeries) -> GeoDataFrame | GeoSeries:
381
390
 
382
391
 
383
392
  def make_lines_between_points(
384
- arr1: NDArray[Point] | GeometryArray | GeoSeries,
385
- arr2: NDArray[Point] | GeometryArray | GeoSeries,
393
+ *arrs: NDArray[Point] | GeometryArray | GeoSeries,
386
394
  ) -> NDArray[LineString]:
387
- """Creates an array of linestrings from two arrays of points.
395
+ """Creates an array of linestrings from two or more arrays of points.
388
396
 
389
- The operation is done rowwise.
397
+ The lines are created rowwise, meaning from arr0[0] to arr1[0], from arr0[1] to arr1[1]...
398
+ If more than two arrays are passed, e.g. three arrays,
399
+ the lines will go from arr0[0] via arr1[0] to arr2[0].
390
400
 
391
401
  Args:
392
- arr1: GeometryArray og GeoSeries of points.
393
- arr2: GeometryArray og GeoSeries of points of same length as arr1.
402
+ arrs: 1 dimensional arrays of point geometries.
403
+ All arrays must have the same shape.
404
+ Must be at least two arrays.
394
405
 
395
406
  Returns:
396
407
  A numpy array of linestrings.
397
408
 
398
- Raises:
399
- ValueError: If the arrays have unequal shape.
400
-
401
409
  """
402
- if arr1.shape != arr2.shape:
403
- raise ValueError("Arrays must have equal shape.")
404
-
405
- coords: pd.DataFrame = pd.concat(
406
- [
407
- pd.DataFrame(get_coordinates(arr1), columns=["x", "y"]),
408
- pd.DataFrame(get_coordinates(arr2), columns=["x", "y"]),
409
- ]
410
- ).sort_index()
411
-
412
- return linestrings(coords.values, indices=coords.index)
410
+ coords = [get_coordinates(arr, return_index=False) for arr in arrs]
411
+ return linestrings(
412
+ np.concatenate([coords_arr[:, None, :] for coords_arr in coords], axis=1)
413
+ )
413
414
 
414
415
 
415
416
  def random_points(n: int, loc: float | int = 0.5) -> GeoDataFrame:
@@ -423,7 +424,7 @@ def random_points(n: int, loc: float | int = 0.5) -> GeoDataFrame:
423
424
  A GeoDataFrame of points with n rows.
424
425
 
425
426
  Examples:
426
- --------
427
+ ---------
427
428
  >>> import sgis as sg
428
429
  >>> points = sg.random_points(10_000)
429
430
  >>> points
@@ -523,7 +524,7 @@ def to_lines(*gdfs: GeoDataFrame, copy: bool = True) -> GeoDataFrame:
523
524
  always ignores the index.
524
525
 
525
526
  Examples:
526
- --------
527
+ ---------
527
528
  Convert single polygon to linestring.
528
529
 
529
530
  >>> import sgis as sg
@@ -559,7 +560,9 @@ def to_lines(*gdfs: GeoDataFrame, copy: bool = True) -> GeoDataFrame:
559
560
  raise TypeError("gdf must be GeoDataFrame or GeoSeries")
560
561
 
561
562
  if any(gdf.geom_type.isin(["Point", "MultiPoint"]).any() for gdf in gdfs):
562
- raise ValueError("Cannot convert points to lines.")
563
+ raise ValueError(
564
+ f"Cannot convert points to lines. {[gdf.geom_type.value_counts() for gdf in gdfs]}"
565
+ )
563
566
 
564
567
  def _shapely_geometry_to_lines(geom):
565
568
  """Get all lines from the exterior and interiors of a Polygon."""
@@ -583,7 +586,7 @@ def to_lines(*gdfs: GeoDataFrame, copy: bool = True) -> GeoDataFrame:
583
586
 
584
587
  lines += interior_rings
585
588
 
586
- return unary_union(lines)
589
+ return union_all(lines)
587
590
 
588
591
  lines = []
589
592
  for gdf in gdfs:
@@ -673,6 +676,162 @@ def clean_clip(
673
676
  return gdf
674
677
 
675
678
 
679
+ def extend_lines(arr1, arr2, distance) -> NDArray[LineString]:
680
+ if len(arr1) != len(arr2):
681
+ raise ValueError
682
+ if not len(arr1):
683
+ return arr1
684
+
685
+ arr1, arr2 = arr2, arr1 # TODO fix
686
+
687
+ coords1 = coordinate_array(arr1)
688
+ coords2 = coordinate_array(arr2)
689
+
690
+ dx = coords2[:, 0] - coords1[:, 0]
691
+ dy = coords2[:, 1] - coords1[:, 1]
692
+ len_xy = np.sqrt((dx**2.0) + (dy**2.0))
693
+ x = coords1[:, 0] + (coords1[:, 0] - coords2[:, 0]) / len_xy * distance
694
+ y = coords1[:, 1] + (coords1[:, 1] - coords2[:, 1]) / len_xy * distance
695
+
696
+ new_points = np.array([None for _ in range(len(arr1))])
697
+ new_points[~np.isnan(x)] = shapely.points(x[~np.isnan(x)], y[~np.isnan(x)])
698
+
699
+ new_points[~np.isnan(x)] = make_lines_between_points(
700
+ arr2[~np.isnan(x)], new_points[~np.isnan(x)]
701
+ )
702
+ return new_points
703
+
704
+
705
+ def multipoints_to_line_segments_numpy(
706
+ points: GeoSeries | NDArray[MultiPoint] | MultiPoint,
707
+ cycle: bool = False,
708
+ ) -> list[LineString]:
709
+ try:
710
+ arr = get_parts(points.geometry.values)
711
+ except AttributeError:
712
+ arr = get_parts(points)
713
+
714
+ line_between_last_and_first = [LineString([arr[-1], arr[0]])] if cycle else []
715
+ return [
716
+ LineString([p0, p1]) for p0, p1 in itertools.pairwise(arr)
717
+ ] + line_between_last_and_first
718
+
719
+
720
+ def multipoints_to_line_segments(
721
+ multipoints: GeoSeries | GeoDataFrame, cycle: bool = True # to_next: bool = True,
722
+ ) -> GeoSeries | GeoDataFrame:
723
+
724
+ if not len(multipoints):
725
+ return multipoints
726
+
727
+ if isinstance(multipoints, GeoDataFrame):
728
+ df = multipoints.drop(columns=multipoints.geometry.name)
729
+ multipoints = multipoints.geometry
730
+ was_gdf = True
731
+ else:
732
+ multipoints = to_geoseries(multipoints)
733
+ was_gdf = False
734
+
735
+ multipoints = to_geoseries(multipoints)
736
+
737
+ segs = pd.Series(
738
+ [
739
+ multipoints_to_line_segments_numpy(geoms, cycle=cycle)
740
+ for geoms in multipoints
741
+ ],
742
+ index=multipoints.index,
743
+ ).explode()
744
+
745
+ segs = GeoSeries(segs, crs=multipoints.crs, name=multipoints.name)
746
+
747
+ if was_gdf:
748
+ return GeoDataFrame(df.join(segs), geometry=segs.name, crs=segs.crs)
749
+ else:
750
+ return segs
751
+
752
+
753
+ def get_line_segments(
754
+ lines: GeoDataFrame | GeoSeries, extract_unique: bool = False, cycle=False
755
+ ) -> GeoDataFrame:
756
+ try:
757
+ assert lines.index.is_unique
758
+ except AttributeError:
759
+ pass
760
+
761
+ if isinstance(lines, GeoDataFrame):
762
+ df = lines.drop(columns=lines.geometry.name)
763
+ lines = lines.geometry
764
+ was_gdf = True
765
+ else:
766
+ lines = to_geoseries(lines)
767
+ was_gdf = False
768
+
769
+ partial_segs_func = functools.partial(
770
+ multipoints_to_line_segments_numpy, cycle=cycle
771
+ )
772
+ if extract_unique:
773
+ points = extract_unique_points(lines.geometry.values)
774
+ segs = pd.Series(
775
+ [partial_segs_func(geoms) for geoms in points],
776
+ index=lines.index,
777
+ ).explode()
778
+ else:
779
+ coords, indices = shapely.get_coordinates(lines, return_index=True)
780
+ points = GeoSeries(shapely.points(coords), index=indices)
781
+ index_mapper = {
782
+ i: idx
783
+ for i, idx in zip(
784
+ np.unique(indices), lines.index.drop_duplicates(), strict=True
785
+ )
786
+ }
787
+ points.index = points.index.map(index_mapper)
788
+
789
+ segs = points.groupby(level=0).agg(partial_segs_func).explode()
790
+ segs = GeoSeries(segs, crs=lines.crs, name=lines.name)
791
+
792
+ if was_gdf:
793
+ return GeoDataFrame(df.join(segs), geometry=segs.name, crs=lines.crs)
794
+ else:
795
+ return segs
796
+
797
+
798
+ def get_index_right_columns(gdf: pd.DataFrame | pd.Series) -> list[str]:
799
+ """Get a list of what will be the resulting columns in an sjoin."""
800
+ if gdf.index.name is None and all(name is None for name in gdf.index.names):
801
+ if gdf.index.nlevels == 1:
802
+ return ["index_right"]
803
+ else:
804
+ return [f"index_right{i}" for i in range(gdf.index.nlevels)]
805
+ else:
806
+ return gdf.index.names
807
+
808
+
809
+ def points_in_bounds(
810
+ gdf: GeoDataFrame | GeoSeries, gridsize: int | float
811
+ ) -> GeoDataFrame:
812
+ """Get a GeoDataFrame of points within the bounds of the GeoDataFrame."""
813
+ minx, miny, maxx, maxy = to_bbox(gdf)
814
+ try:
815
+ crs = gdf.crs
816
+ except AttributeError:
817
+ crs = None
818
+
819
+ xs = np.linspace(minx, maxx, num=int((maxx - minx) / gridsize))
820
+ ys = np.linspace(miny, maxy, num=int((maxy - miny) / gridsize))
821
+ x_coords, y_coords = np.meshgrid(xs, ys, indexing="ij")
822
+ coords = np.concatenate((x_coords.reshape(-1, 1), y_coords.reshape(-1, 1)), axis=1)
823
+ return to_gdf(coords, crs=crs)
824
+
825
+
826
+ def points_in_polygons(
827
+ gdf: GeoDataFrame | GeoSeries, gridsize: int | float
828
+ ) -> GeoDataFrame:
829
+ index_right_col = get_index_right_columns(gdf)
830
+ out = points_in_bounds(gdf, gridsize).sjoin(gdf).set_index(index_right_col)
831
+ out.index.name = gdf.index.name
832
+ return out.sort_index()
833
+
834
+
676
835
  def _determine_geom_type_args(
677
836
  gdf: GeoDataFrame, geom_type: str | None, keep_geom_type: bool | None
678
837
  ) -> tuple[GeoDataFrame, str, bool]:
@@ -692,65 +851,93 @@ def _determine_geom_type_args(
692
851
  return gdf, geom_type, keep_geom_type
693
852
 
694
853
 
695
- def _merge_geometries(geoms: GeoSeries, grid_size=None) -> Geometry:
696
- return make_valid(unary_union(geoms, grid_size=grid_size))
854
+ def _unary_union_for_notna(geoms, **kwargs):
855
+ try:
856
+ return make_valid(union_all(geoms, **kwargs))
857
+ except TypeError:
858
+ return union_all([geom for geom in geoms.dropna().values], **kwargs)
859
+
860
+
861
+ def _grouped_unary_union(
862
+ df: GeoDataFrame | GeoSeries | pd.DataFrame | pd.Series,
863
+ by: str | list[str] | None = None,
864
+ level: int | None = None,
865
+ as_index: bool = True,
866
+ grid_size: float | int | None = None,
867
+ dropna: bool = False,
868
+ **kwargs,
869
+ ) -> GeoSeries | GeoDataFrame:
870
+ """Vectorized unary_union for groups.
697
871
 
872
+ Experimental. Messy code.
873
+ """
874
+ df = df.copy()
875
+ df_orig = df.copy()
698
876
 
699
- def _parallel_unary_union(
700
- gdf: GeoDataFrame, n_jobs: int = 1, by=None, grid_size=None, **kwargs
701
- ) -> list[Geometry]:
702
877
  try:
703
- geom_col = gdf._geometry_column_name
878
+ geom_col = df._geometry_column_name
704
879
  except AttributeError:
705
- geom_col = "geometry"
706
-
707
- if by is not None and not isinstance(by, str):
708
- gdf = gdf.copy()
709
880
  try:
710
- gdf["_by"] = gdf[by].astype(str).agg("-".join, axis=1)
711
- except KeyError:
712
- gdf["_by"] = by
713
- by = "_by"
881
+ geom_col = df.name
882
+ if geom_col is None:
883
+ geom_col = "geometry"
884
+ except AttributeError:
885
+ geom_col = "geometry"
714
886
 
715
- if gdf.crs is None:
716
- gdf.crs = 25833
717
- _was_none = True
718
- else:
719
- _was_none = False
887
+ if not len(df):
888
+ return GeoSeries(name=geom_col)
720
889
 
721
- if isinstance(gdf.index, pd.MultiIndex):
722
- gdf = gdf.reset_index(drop=True)
890
+ if isinstance(df, pd.Series):
891
+ df.name = geom_col
892
+ original_index = df.index
893
+ df = df.reset_index()
894
+ df.index = original_index
723
895
 
724
- dissolved = (
725
- dask_geopandas.from_geopandas(gdf, npartitions=n_jobs).dissolve(by).compute()
726
- )
727
- if _was_none:
728
- dissolved.crs = None
896
+ if isinstance(by, str):
897
+ by = [by]
898
+ elif by is None and level is None:
899
+ raise TypeError("You have to supply one of 'by' and 'level'")
900
+ elif by is None:
901
+ by = df.index.get_level_values(level)
729
902
 
730
- return dissolved.geometry
903
+ cumcount = df.groupby(by, dropna=dropna).cumcount().values
731
904
 
905
+ def get_col_or_index(df, col: str) -> pd.Series | pd.Index:
906
+ try:
907
+ return df[col]
908
+ except KeyError:
909
+ for i, name in enumerate(df.index.names):
910
+ if name == col:
911
+ return df.index.get_level_values(i)
912
+ raise KeyError(col)
732
913
 
733
- def _parallel_unary_union_geoseries(
734
- ser: GeoSeries, n_jobs: int = 1, grid_size=None, **kwargs
735
- ) -> list[Geometry]:
736
- if ser.crs is None:
737
- ser.crs = 25833
738
- _was_none = True
739
- else:
740
- _was_none = False
914
+ try:
915
+ df.index = pd.MultiIndex.from_arrays(
916
+ [cumcount, *[get_col_or_index(df, col) for col in by]]
917
+ )
918
+ except KeyError:
919
+ df.index = pd.MultiIndex.from_arrays([cumcount, by])
920
+
921
+ # to wide format: each row will be one group to be merged to one geometry
922
+ try:
923
+ geoms_wide: pd.DataFrame = df[geom_col].unstack(level=0)
924
+ except Exception as e:
925
+ bb = [*by, geom_col]
926
+ raise e.__class__(e, f"by={by}", df_orig[bb], df[geom_col]) from e
927
+ geometries_2d: NDArray[Polygon | None] = geoms_wide.values
928
+ try:
929
+ geometries_2d = make_valid(geometries_2d)
930
+ except TypeError:
931
+ # make_valid doesn't like nan, so converting to None
932
+ # np.isnan doesn't accept geometry type, so using isinstance
933
+ np_isinstance = np.vectorize(isinstance)
934
+ geometries_2d[np_isinstance(geometries_2d, Geometry) == False] = None
741
935
 
742
- if isinstance(ser.index, pd.MultiIndex):
743
- ser = ser.reset_index(drop=True)
936
+ unioned = make_valid(union_all(geometries_2d, axis=1, **kwargs))
744
937
 
745
- dissolved = (
746
- dask_geopandas.from_geopandas(ser.to_frame("geometry"), npartitions=n_jobs)
747
- .dissolve(**kwargs)
748
- .compute()
749
- )
750
- if _was_none:
751
- dissolved.crs = None
938
+ geoms = GeoSeries(unioned, name=geom_col, index=geoms_wide.index)
752
939
 
753
- return dissolved.geometry
940
+ return geoms if as_index else geoms.reset_index()
754
941
 
755
942
 
756
943
  def _parallel_unary_union(
@@ -765,36 +952,12 @@ def _parallel_unary_union(
765
952
  delayed_operations = []
766
953
  for _, geoms in gdf.groupby(by, **kwargs)[geom_col]:
767
954
  delayed_operations.append(
768
- joblib.delayed(_merge_geometries)(geoms, grid_size=grid_size)
955
+ joblib.delayed(_unary_union_for_notna)(geoms, grid_size=grid_size)
769
956
  )
770
957
 
771
958
  return parallel(delayed_operations)
772
959
 
773
960
 
774
- def _parallel_unary_union_geoseries(
775
- ser: GeoSeries, n_jobs: int = 1, grid_size=None, **kwargs
776
- ) -> list[Geometry]:
777
-
778
- is_one_hit = ser.groupby(**kwargs).transform("size") == 1
779
-
780
- one_hit = ser.loc[is_one_hit]
781
- many_hits = ser.loc[~is_one_hit]
782
-
783
- with joblib.Parallel(n_jobs=n_jobs, backend="threading") as parallel:
784
- delayed_operations = []
785
- for _, geoms in many_hits.groupby(**kwargs):
786
- delayed_operations.append(
787
- joblib.delayed(_merge_geometries)(geoms, grid_size=grid_size)
788
- )
789
-
790
- dissolved = pd.Series(
791
- parallel(delayed_operations),
792
- index=is_one_hit[lambda x: x is False].index.unique(),
793
- )
794
-
795
- return pd.concat([dissolved, one_hit]).sort_index().values
796
-
797
-
798
961
  def _parallel_unary_union_geoseries(
799
962
  ser: GeoSeries, n_jobs: int = 1, grid_size=None, **kwargs
800
963
  ) -> list[Geometry]:
@@ -803,7 +966,7 @@ def _parallel_unary_union_geoseries(
803
966
  delayed_operations = []
804
967
  for _, geoms in ser.groupby(**kwargs):
805
968
  delayed_operations.append(
806
- joblib.delayed(_merge_geometries)(geoms, grid_size=grid_size)
969
+ joblib.delayed(_unary_union_for_notna)(geoms, grid_size=grid_size)
807
970
  )
808
971
 
809
972
  return parallel(delayed_operations)