PyPI - ssb-sgis - Versions diffs - 0.1.5__py3-none-any.whl → 0.1.6__py3-none-any.whl - Mend

ssb-sgis 0.1.5py3-none-any.whl → 0.1.6py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (19) hide show

sgis/geopandas_tools/general.py +3 -5
sgis/geopandas_tools/geometry_types.py +1 -1
sgis/geopandas_tools/line_operations.py +1 -1
sgis/maps/explore.py +0 -85
sgis/maps/legend.py +5 -5
sgis/maps/maps.py +5 -1
sgis/maps/thematicmap.py +35 -10
sgis/networkanalysis/_get_route.py +168 -114
sgis/networkanalysis/_od_cost_matrix.py +7 -9
sgis/networkanalysis/_points.py +0 -18
sgis/networkanalysis/directednetwork.py +2 -2
sgis/networkanalysis/network.py +16 -25
sgis/networkanalysis/networkanalysis.py +301 -123
sgis/networkanalysis/networkanalysisrules.py +2 -2
{ssb_sgis-0.1.5.dist-info → ssb_sgis-0.1.6.dist-info}/METADATA +15 -7
ssb_sgis-0.1.6.dist-info/RECORD +35 -0
ssb_sgis-0.1.5.dist-info/RECORD +0 -35
{ssb_sgis-0.1.5.dist-info → ssb_sgis-0.1.6.dist-info}/LICENSE +0 -0
{ssb_sgis-0.1.5.dist-info → ssb_sgis-0.1.6.dist-info}/WHEEL +0 -0

sgis/networkanalysis/networkanalysis.py CHANGED Viewed

@@ -18,12 +18,12 @@ from pandas import DataFrame
 from ..geopandas_tools.general import _push_geom_col
 from ..geopandas_tools.line_operations import split_lines_by_nearest_point
-from ._get_route import _get_route
+from ._get_route import _get_k_routes, _get_route, _get_route_frequencies
 from ._od_cost_matrix import _od_cost_matrix
 from ._points import Destinations, Origins
 from ._service_area import _service_area
 from .directednetwork import DirectedNetwork
-from .network import Network, _edge_ids
+from .network import Network
 from .networkanalysisrules import NetworkAnalysisRules
@@ -71,24 +71,24 @@ class NetworkAnalysis:
     See also
     --------
-    DirectedNetwork : for customising and optimising line data before directed network
+    DirectedNetwork : For customising and optimising line data before directed network
         analysis.
-    Network : for customising and optimising line data before undirected network
+    Network : For customising and optimising line data before undirected network
         analysis.
     Examples
     --------
     Read example data.
-    >>> from sgis import read_parquet_url
-    >>> roads = read_parquet_url("https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/roads_eidskog_2022.parquet")
-    >>> points = read_parquet_url("https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/points_eidskog.parquet")
+    >>> import sgis as sg
+    >>> roads = sg.read_parquet_url("https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/roads_eidskog_2022.parquet")
+    >>> points = sg.read_parquet_url("https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/points_eidskog.parquet")
     Creating a NetworkAnalysis class instance.
-    >>> from sgis import DirectedNetwork, NetworkAnalysisRules, NetworkAnalysis
     >>> nw = (
-    ...     DirectedNetwork(roads)
+    ...     sg.DirectedNetwork(roads)
     ...     .remove_isolated()
     ...     .make_directed_network(
     ...         direction_col="oneway",
@@ -96,12 +96,13 @@ class NetworkAnalysis:
     ...         minute_cols=("drivetime_fw", "drivetime_bw"),
     ...     )
     ... )
-    >>> rules = NetworkAnalysisRules(weight="minutes")
-    >>> nwa = NetworkAnalysis(network=nw, rules=rules, detailed_log=False)
+    >>> rules = sg.NetworkAnalysisRules(weight="minutes")
+    >>> nwa = sg.NetworkAnalysis(network=nw, rules=rules, detailed_log=False)
     >>> nwa
     NetworkAnalysis(
         network=DirectedNetwork(6364 km, percent_bidirectional=87),
-        rules=NetworkAnalysisRules(weight='minutes', search_tolerance=250, search_factor=10, split_lines=False, ...)
+        rules=NetworkAnalysisRules(weight='minutes', search_tolerance=250, search_factor=10, split_lines=False, ...),
+        log=True, detailed_log=True,
     )
     od_cost_matrix: fast many-to-many travel time/distance calculation.
@@ -120,7 +121,6 @@ class NetworkAnalysis:
     999997     999          997  10.288465
     999998     999          998  14.798257
     999999     999          999   0.000000
     [1000000 rows x 3 columns]
     get_route: get the geometry of the routes.
@@ -139,7 +139,6 @@ class NetworkAnalysis:
     97     606          901  16.998595  MULTILINESTRING Z ((265040.505 6641218.021 100...
     98     606          766  10.094371  MULTILINESTRING Z ((265639.400 6649020.000 85....
     99     606          320   7.317098  MULTILINESTRING Z ((262711.480 6648807.500 3.8...
     [100 rows x 4 columns]
     get_route_frequencies: get the number of times each line segment was used.
@@ -147,19 +146,19 @@ class NetworkAnalysis:
     >>> frequencies = nwa.get_route_frequencies(points.sample(25), points.sample(25))
     >>> frequencies[[["source", "target", "frequency", "geometry"]]
            source target  frequency                                           geometry
-    116897  28500  13496        1.0  LINESTRING Z (256638.500 6653339.300 153.857, ...
-    155781  23913  23908        1.0  LINESTRING Z (256843.774 6653563.678 143.702, ...
-    155780  76957  23913        1.0  LINESTRING Z (256866.300 6653559.400 142.457, ...
-    155779  76956  76957        1.0  LINESTRING Z (256875.300 6653557.100 142.157, ...
-    155778  74816  76956        1.0  LINESTRING Z (256882.738 6653554.580 141.657, ...
+    160188  77264  79112        1.0  LINESTRING Z (268641.225 6651871.624 111.355, ...
+    138956  30221  45403        1.0  LINESTRING Z (273091.100 6652396.000 170.471, ...
+    138958  30224  30221        1.0  LINESTRING Z (273117.500 6652391.500 169.771, ...
+    138960  16513  30224        1.0  LINESTRING Z (273176.813 6652379.896 169.414, ...
+    138962  40610  16513        1.0  LINESTRING Z (273207.300 6652372.100 168.871, ...
     ...       ...    ...        ...                                                ...
-    156631  77375  77374       90.0  LINESTRING Z (265454.387 6651000.044 88.806, 2...
-    149793  72649  77375       90.0  LINESTRING Z (265455.009 6651007.750 88.612, 2...
-    158249  78124  78123       95.0  LINESTRING Z (265563.150 6650547.620 89.382, 2...
-    158248  78123  72820       95.0  LINESTRING Z (265567.158 6650542.836 89.522, 2...
-    156601  77353  78124       95.0  LINESTRING Z (265530.470 6650587.640 88.527, 2...
+    151464  73800  73801      108.0  LINESTRING Z (265362.800 6647137.100 131.660, ...
+    151465  73801  73802      108.0  LINESTRING Z (265368.600 6647142.900 131.660, ...
+    151466  73802  73632      108.0  LINESTRING Z (265371.400 6647147.900 131.660, ...
+    151463  73799  73800      129.0  LINESTRING Z (265359.600 6647135.400 131.660, ...
+    152170  74418  74246      135.0  LINESTRING Z (264579.835 6651954.573 113.209, ...
-    [9268 rows x 4 columns]
+    [8915 rows x 4 columns]
     service_area: get the area that can be reached within one or more breaks.
@@ -187,8 +186,8 @@ class NetworkAnalysis:
     1 2023-03-29 15:20:21              0.5              get_route             10                10.0           0.0000  15.001443              True  ...  10.093613   14.641413  19.725085  6.869095    NaN   False        NaN       NaN
     2 2023-03-29 15:20:40              0.3  get_route_frequencies             25                25.0           0.0000   0.067199              True  ...   0.013309    0.038496   0.085692  0.087247    NaN     NaN        NaN       NaN
     3 2023-03-29 15:20:50              0.2           service_area              3                 NaN           0.0000  10.000000              True  ...   5.000000   10.000000  15.000000  4.330127    NaN     NaN  5, 10, 15      True
     [4 rows x 23 columns]
     """
     def __init__(
@@ -274,15 +273,19 @@ class NetworkAnalysis:
         Examples
         --------
+        Create the NetworkAnalysis instance.
+        >>> import sgis as sg
+        >>> roads = sg.read_parquet_url("https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/roads_eidskog_2022.parquet")
+        >>> nw = sg.DirectedNetwork(roads).remove_isolated().make_directed_network_norway()
+        >>> rules = sg.NetworkAnalysisRules(weight="minutes")
+        >>> nwa = sg.NetworkAnalysis(network=nw, rules=rules, detailed_log=False)
         Create some origin and destination points.
-        See the class examples for how to prepare the network.
-        import sgis as sg
-        >>> points = sg.read_parquet_url(
-        ...     "https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/points_oslo.parquet"
-        ... )
+        >>> points = sg.read_parquet_url("https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/points_oslo.parquet")
-        >>> origins = points.loc[:99]
+        >>> origins = points.loc[:99, ["geometry"]]
         >>> origins
                                   geometry
         0   POINT (263122.700 6651184.900)
@@ -296,10 +299,9 @@ class NetworkAnalysis:
         97  POINT (263162.000 6650732.200)
         98  POINT (272322.700 6653729.100)
         99  POINT (265622.800 6644644.200)
         [100 rows x 1 columns]
-        >>> destinations = points.loc[100:199]
+        >>> destinations = points.loc[100:199, ["geometry"]]
         >>> destinations
                                    geometry
         100  POINT (265997.900 6647899.400)
@@ -313,7 +315,6 @@ class NetworkAnalysis:
         197  POINT (273135.300 6653198.100)
         198  POINT (270582.300 6652163.800)
         199  POINT (264980.800 6647231.300)
         [100 rows x 1 columns]
         Travel time from 100 to 100 points.
@@ -332,7 +333,6 @@ class NetworkAnalysis:
         9997      99          197  19.977029
         9998      99          198  15.233163
         9999      99          199   6.439002
         [10000 rows x 3 columns]
         Join the results onto the 'origins' GeoDataFrame via the index.
@@ -351,7 +351,6 @@ class NetworkAnalysis:
         99  POINT (265622.800 6644644.200)          197  19.977029
         99  POINT (265622.800 6644644.200)          198  15.233163
         99  POINT (265622.800 6644644.200)          199   6.439002
         [10000 rows x 3 columns]
         Get travel times below 10 minutes.
@@ -371,7 +370,6 @@ class NetworkAnalysis:
         99  POINT (265622.800 6644644.200)        177.0  5.944194
         99  POINT (265622.800 6644644.200)        183.0  8.449906
         99  POINT (265622.800 6644644.200)        199.0  6.439002
         [2195 rows x 3 columns]
         Get the three fastest routes from each origin.
@@ -391,7 +389,6 @@ class NetworkAnalysis:
         99  POINT (265622.800 6644644.200)        102.0  1.648705
         99  POINT (265622.800 6644644.200)        134.0  1.116209
         99  POINT (265622.800 6644644.200)        156.0  1.368926
         [294 rows x 3 columns]
         Assign aggregated values directly onto the origins via the index.
@@ -410,6 +407,7 @@ class NetworkAnalysis:
         97  POINT (263162.000 6650732.200)     11.904372
         98  POINT (272322.700 6653729.100)     17.579399
         99  POINT (265622.800 6644644.200)     12.185800
+        [100 rows x 2 columns]
         Use set_index to use column as identifier insted of the index.
@@ -428,7 +426,6 @@ class NetworkAnalysis:
         9997      b          197  19.977029
         9998      b          198  15.233163
         9999      b          199   6.439002
         [10000 rows x 3 columns]
         Travel time from 1000 to 1000 points rowwise.
@@ -448,13 +445,13 @@ class NetworkAnalysis:
         997     997          997  19.968743
         998     998          998   9.484374
         999     999          999  14.892648
         [1000 rows x 3 columns]
         """
         if self._log:
             time_ = perf_counter()
-        self._prepare_network_analysis(origins, destinations)
+        self._prepare_network_analysis(origins, destinations, rowwise)
         results = _od_cost_matrix(
             graph=self.graph,
@@ -465,9 +462,6 @@ class NetworkAnalysis:
             rowwise=rowwise,
         )
-        self.origins._get_n_missing(results, "origin")
-        self.destinations._get_n_missing(results, "destination")
         results["origin"] = results["origin"].map(self.origins.idx_dict)
         results["destination"] = results["destination"].map(self.destinations.idx_dict)
@@ -519,12 +513,17 @@ class NetworkAnalysis:
         Examples
         --------
+        Create the NetworkAnalysis instance.
+        >>> import sgis as sg
+        >>> roads = sg.read_parquet_url("https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/roads_eidskog_2022.parquet")
+        >>> nw = sg.DirectedNetwork(roads).remove_isolated().make_directed_network_norway()
+        >>> rules = sg.NetworkAnalysisRules(weight="minutes")
+        >>> nwa = sg.NetworkAnalysis(network=nw, rules=rules, detailed_log=False)
         Get routes from 1 to 1000 points.
-        import sgis as sg
-        >>> points = sg.read_parquet_url(
-        ...     "https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/points_oslo.parquet"
-        ... )
+        >>> points = sg.read_parquet_url("https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/points_oslo.parquet")
         >>> routes = nwa.get_route(points.iloc[[0]], points)
         >>> routes
@@ -546,7 +545,7 @@ class NetworkAnalysis:
         if self._log:
             time_ = perf_counter()
-        self._prepare_network_analysis(origins, destinations)
+        self._prepare_network_analysis(origins, destinations, rowwise)
         results = _get_route(
             graph=self.graph,
@@ -557,15 +556,9 @@ class NetworkAnalysis:
             rowwise=rowwise,
         )
-        self.origins._get_n_missing(results, "origin")
-        self.destinations._get_n_missing(results, "destination")
         results["origin"] = results["origin"].map(self.origins.idx_dict)
         results["destination"] = results["destination"].map(self.destinations.idx_dict)
-        if isinstance(results, GeoDataFrame):
-            results = _push_geom_col(results)
         if self.rules.split_lines:
             self._unsplit_network()
@@ -628,10 +621,15 @@ class NetworkAnalysis:
         Examples
         --------
-        import sgis as sg
-        >>> points = sg.read_parquet_url(
-        ...     "https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/points_oslo.parquet"
-        ... )
+        Create the NetworkAnalysis instance.
+        >>> import sgis as sg
+        >>> roads = sg.read_parquet_url("https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/roads_eidskog_2022.parquet")
+        >>> nw = sg.DirectedNetwork(roads).remove_isolated().make_directed_network_norway()
+        >>> rules = sg.NetworkAnalysisRules(weight="minutes")
+        >>> nwa = sg.NetworkAnalysis(network=nw, rules=rules, detailed_log=False)
+        >>> points = sg.read_parquet_url("https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/points_oslo.parquet")
         >>> point1 = points.iloc[[0]]
         >>> point2 = points.iloc[[1]]
@@ -656,8 +654,9 @@ class NetworkAnalysis:
         8       0            1  16.513253   9  MULTILINESTRING Z ((272281.367 6653079.745 160...
         9       0            1  16.551196  10  MULTILINESTRING Z ((272281.367 6653079.745 160...
-        We got all 10 routes because only the middle 1 percent of the routes are removed in
-        each iteration. Let's compare with dropping middle 50 and middle 100 percent.
+        We got all 10 routes because only the middle 1 percent of the routes are
+        removed in each iteration. Let's compare with dropping middle 50 and middle
+        100 percent.
         >>> k_routes = nwa.get_k_routes(
         ...             point1,
@@ -689,9 +688,9 @@ class NetworkAnalysis:
         if self._log:
             time_ = perf_counter()
-        self._prepare_network_analysis(origins, destinations)
+        self._prepare_network_analysis(origins, destinations, rowwise)
-        results = _get_route(
+        results = _get_k_routes(
             graph=self.graph,
             origins=self.origins.gdf,
             destinations=self.destinations.gdf,
@@ -702,9 +701,6 @@ class NetworkAnalysis:
             drop_middle_percent=drop_middle_percent,
         )
-        self.origins._get_n_missing(results, "origin")
-        self.destinations._get_n_missing(results, "destination")
         results["origin"] = results["origin"].map(self.origins.idx_dict)
         results["destination"] = results["destination"].map(self.destinations.idx_dict)
@@ -729,6 +725,8 @@ class NetworkAnalysis:
         self,
         origins: GeoDataFrame,
         destinations: GeoDataFrame,
+        weight_df: DataFrame | None = None,
+        rowwise: bool = False,
         frequency_col: str = "frequency",
     ) -> GeoDataFrame:
         """Finds the number of times each line segment was visited in all trips.
@@ -738,9 +736,18 @@ class NetworkAnalysis:
         segment was used. The aggregation is done on the line indices, which is much
         faster than getting the geometries and then dissolving.
+        The trip frequencies can be weighted (multiplied) based on 'weight_df'. See
+        example below.
         Args:
-            origins: GeoDataFrame of points from where the routes will originate
-            destinations: GeoDataFrame of points from where the routes will terminate
+            origins: GeoDataFrame of points from where the routes will originate.
+            destinations: GeoDataFrame of points from where the routes will terminate.
+            weight_df: A long formated DataFrame where each row contains the indices of
+                an origin-destination pair and the number to multiply the frequency for
+                this route by. The DataFrame can either contain three columns (origin
+                index, destination index and weight. In that order) or only a weight
+                column and a MultiIndex where level 0 is origin index and level 1 is
+                destination index.
             frequency_col: Name of column with the number of times each road was
                 visited. Defaults to 'frequency'.
@@ -753,52 +760,146 @@ class NetworkAnalysis:
             The resulting lines will keep all columns of the 'gdf' of the Network.
         Raises:
-            ValueError: if no paths were found.
+            ValueError: If no paths were found.
+            ValueError: If weight_df is not a DataFrame with one or three columns.
+            ValueError: If weight_df is given and the index of origins/destinations
+                is not unique.
         Examples
         --------
+        Create the NetworkAnalysis instance.
+        >>> import sgis as sg
+        >>> import pandas as pd
+        >>> roads = sg.read_parquet_url("https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/roads_eidskog_2022.parquet")
+        >>> nw = sg.DirectedNetwork(roads).remove_isolated().make_directed_network_norway()
+        >>> rules = sg.NetworkAnalysisRules(weight="minutes")
+        >>> nwa = sg.NetworkAnalysis(network=nw, rules=rules, detailed_log=False)
         Get number of times each road was visited for trips from 25 to 25 points.
-        import sgis as sg
-        >>> points = sg.read_parquet_url(
-        ...     "https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/points_oslo.parquet"
-        ... )
+        >>> points = sg.read_parquet_url("https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/points_oslo.parquet")
-        >>> frequencies = nwa.get_route_frequencies(points.sample(25), points.sample(25))
+        >>> origins = points.iloc[:25]
+        >>> destinations = points.iloc[25:50]
+        >>> frequencies = nwa.get_route_frequencies(origins, destinations)
         >>> frequencies[["source", "target", "frequency", "geometry"]]
-               source target   frequency                                          geometry
-        137866  19095  44962    1.0      LINESTRING Z (265476.114 6645475.318 160.724, ...
-        138905  30597  16266    1.0      LINESTRING Z (272648.400 6652234.800 178.170, ...
-        138903  16266  45388    1.0      LINESTRING Z (272642.602 6652236.229 178.687, ...
-        138894  43025  30588    1.0      LINESTRING Z (272446.600 6652253.700 162.970, ...
-        138892  30588  16021    1.0      LINESTRING Z (272414.400 6652263.100 161.170, ...
-        ...       ...    ...    ...                                                    ...
-        158287  78157  78156  176.0      LINESTRING Z (263975.482 6653605.092 132.739, ...
-        149697  72562  72563  180.0      LINESTRING Z (265179.202 6651549.723 81.532, 2...
-        149698  72563  72564  180.0      LINESTRING Z (265178.761 6651549.956 81.561, 2...
-        149695  72560  72561  180.0      LINESTRING Z (265457.755 6651249.238 76.502, 2...
-        149696  72561  72562  180.0      LINESTRING Z (265180.086 6651549.259 81.473, 2...
-        [12231 rows x 4 columns]
+               source target  frequency                                           geometry
+        160188  77264  79112        1.0  LINESTRING Z (268641.225 6651871.624 111.355, ...
+        153682  68376   4136        1.0  LINESTRING Z (268542.700 6652162.400 121.266, ...
+        153679  75263  75502        1.0  LINESTRING Z (268665.600 6652165.400 117.466, ...
+        153678  75262  75263        1.0  LINESTRING Z (268660.000 6652167.100 117.466, ...
+        153677  47999  75262        1.0  LINESTRING Z (268631.500 6652176.800 118.166, ...
+        ...       ...    ...        ...                                                ...
+        151465  73801  73802      103.0  LINESTRING Z (265368.600 6647142.900 131.660, ...
+        151464  73800  73801      103.0  LINESTRING Z (265362.800 6647137.100 131.660, ...
+        151466  73802  73632      103.0  LINESTRING Z (265371.400 6647147.900 131.660, ...
+        151463  73799  73800      123.0  LINESTRING Z (265359.600 6647135.400 131.660, ...
+        152170  74418  74246      130.0  LINESTRING Z (264579.835 6651954.573 113.209, ...
+        [8556 rows x 4 columns]
+        The frequencies can be weighted for each origin-destination pair by specifying
+        'weight_df'. This can be a DataFrame with three columns, where the first two
+        contain the indices of the origin and destination (in that order), and the
+        third the number to multiply the frequency by. 'weight_df' can also be a
+        DataFrame with a 2-leveled MultiIndex, where level 0 is the origin index and
+        level 1 is the destination.
+        Constructing a DataFrame with all od-pair combinations and give all rows a
+        weight of 10.
+        >>> od_pairs = pd.MultiIndex.from_product(
+        ...     [origins.index, destinations.index], names=["origin", "destination"]
+        ... )
+        >>> weight_df = pd.DataFrame(index=od_pairs).reset_index()
+        >>> weight_df["weight"] = 10
+        >>> weight_df
+             origin  destination  weight
+        0         0           25      10
+        1         0           26      10
+        2         0           27      10
+        3         0           28      10
+        4         0           29      10
+        ..      ...          ...     ...
+        620      24           45      10
+        621      24           46      10
+        622      24           47      10
+        623      24           48      10
+        624      24           49      10
+        [625 rows x 3 columns]
+        All frequencies will now be multiplied by 10.
+        >>> frequencies = nwa.get_route_frequencies(origins, destinations, weight_df, weight_df=weight_df)
+        >>> frequencies[["source", "target", "frequency", "geometry"]]
+               source target  frequency                                           geometry
+        160188  77264  79112       10.0  LINESTRING Z (268641.225 6651871.624 111.355, ...
+        153682  68376   4136       10.0  LINESTRING Z (268542.700 6652162.400 121.266, ...
+        153679  75263  75502       10.0  LINESTRING Z (268665.600 6652165.400 117.466, ...
+        153678  75262  75263       10.0  LINESTRING Z (268660.000 6652167.100 117.466, ...
+        153677  47999  75262       10.0  LINESTRING Z (268631.500 6652176.800 118.166, ...
+        ...       ...    ...        ...                                                ...
+        151465  73801  73802     1030.0  LINESTRING Z (265368.600 6647142.900 131.660, ...
+        151464  73800  73801     1030.0  LINESTRING Z (265362.800 6647137.100 131.660, ...
+        151466  73802  73632     1030.0  LINESTRING Z (265371.400 6647147.900 131.660, ...
+        151463  73799  73800     1230.0  LINESTRING Z (265359.600 6647135.400 131.660, ...
+        152170  74418  74246     1300.0  LINESTRING Z (264579.835 6651954.573 113.209, ...
+        [8556 rows x 4 columns]
+        'weight_df' can also be a DataFrame with one column (the weight) and a
+        MultiIndex.
+        >>> weight_df = pd.DataFrame(index=od_pairs)
+        >>> weight_df["weight"] = 10
+        >>> weight_df
+               weight
+        0  25      10
+           26      10
+           27      10
+           28      10
+           29      10
+        ...       ...
+        24 45      10
+           46      10
+           47      10
+           48      10
+           49      10
         """
         if self._log:
             time_ = perf_counter()
-        self._prepare_network_analysis(origins, destinations)
+        if weight_df is not None:
+            weight_df = self._prepare_weight_df(weight_df, origins, destinations)
-        results = _get_route(
+        self._prepare_network_analysis(origins, destinations, rowwise)
+        if weight_df is not None:
+            ori_idx_mapper = {v: k for k, v in self.origins.idx_dict.items()}
+            des_idx_mapper = {v: k for k, v in self.destinations.idx_dict.items()}
+            multiindex_mapper = lambda x: (
+                ori_idx_mapper.get(x[0]),
+                des_idx_mapper.get(x[1]),
+            )
+            weight_df.index = weight_df.index.map(multiindex_mapper)
+        results = _get_route_frequencies(
             graph=self.graph,
             origins=self.origins.gdf,
             destinations=self.destinations.gdf,
-            weight=self.rules.weight,
             roads=self.network.gdf,
-            summarise=True,
+            weight_df=weight_df,
+            rowwise=rowwise,
         )
         if isinstance(results, GeoDataFrame):
             results = _push_geom_col(results)
-        results = results.rename(columns={"n": frequency_col}).sort_values(
+        results = results.rename(columns={"frequency": frequency_col}).sort_values(
             frequency_col
         )
@@ -849,13 +950,17 @@ class NetworkAnalysis:
         Examples
         --------
-        import sgis as sg
-        >>> points = sg.read_parquet_url(
-        ...     "https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/points_oslo.parquet"
-        ... )
+        Create the NetworkAnalysis instance.
+        >>> import sgis as sg
+        >>> roads = sg.read_parquet_url("https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/roads_eidskog_2022.parquet")
+        >>> nw = sg.DirectedNetwork(roads).remove_isolated().make_directed_network_norway()
+        >>> rules = sg.NetworkAnalysisRules(weight="minutes")
+        >>> nwa = sg.NetworkAnalysis(network=nw, rules=rules, detailed_log=False)
         10 minute service area for three origin points.
+        >>> points = sg.read_parquet_url("https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/points_oslo.parquet")
         >>> service_areas = nwa.service_area(
         ...         points.loc[:2],
         ...         breaks=10,
@@ -890,10 +995,6 @@ class NetworkAnalysis:
         # sort the breaks as an np.ndarray
         breaks = self._sort_breaks(breaks)
-        self.network.gdf["source_target_weight"] = _edge_ids(
-            self.network.gdf, self.rules.weight
-        )
         results = _service_area(
             graph=self.graph,
             origins=self.origins.gdf,
@@ -977,13 +1078,18 @@ class NetworkAnalysis:
         Examples
         --------
-        import sgis as sg
-        >>> points = sg.read_parquet_url(
-        ...     "https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/points_oslo.parquet"
-        ... )
+        Create the NetworkAnalysis instance.
+        >>> import sgis as sg
+        >>> roads = sg.read_parquet_url("https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/roads_eidskog_2022.parquet")
+        >>> nw = sg.DirectedNetwork(roads).remove_isolated().make_directed_network_norway()
+        >>> rules = sg.NetworkAnalysisRules(weight="minutes")
+        >>> nwa = sg.NetworkAnalysis(network=nw, rules=rules, detailed_log=False)
         10 minute service area for one origin point.
+        >>> points = sg.read_parquet_url("https://media.githubusercontent.com/media/statisticsnorway/ssb-sgis/main/tests/testdata/points_oslo.parquet")
         >>> sa = nwa.precice_service_area(
         ...         points.iloc[[0]],
         ...         breaks=10,
@@ -1016,10 +1122,6 @@ class NetworkAnalysis:
         # sort the breaks as an np.ndarray
         breaks = self._sort_breaks(breaks)
-        self.network.gdf["source_target_weight"] = _edge_ids(
-            self.network.gdf, self.rules.weight
-        )
         results = _service_area(
             graph=self.graph,
             origins=self.origins.gdf,
@@ -1070,6 +1172,64 @@ class NetworkAnalysis:
         return results
+    @staticmethod
+    def _prepare_weight_df(weight_df, origins, destinations):
+        """Copy weight_df, convert to MultiIndex (if needed), then validate it.
+        The weight_df needs to have a very specific shape and index. If a 3-columned df
+        is given, convert the first two to a MultiIndex.
+        Then make sure this index matches the index of origins and destinations.
+        """
+        error_message = (
+            "'weight_df' should be a DataFrame with the columns "
+            "'origin', 'destination' and 'weight', where the first "
+            "two contain the indices of the origins and destinations "
+            "and the weight column contains the number to multiply "
+            "the trip frequency for this origin-destination pair."
+        )
+        if not isinstance(weight_df, DataFrame):
+            raise ValueError(error_message)
+        weight_df = weight_df.copy()
+        if len(weight_df.columns) == 3:
+            weight_df = weight_df.set_index(list(weight_df.columns[:2]))
+        if len(weight_df.columns) != 1 and isinstance(weight_df.index, pd.MultiIndex):
+            raise ValueError(error_message)
+        if not weight_df.index.is_unique:
+            raise ValueError("'weight_df' must contain only unique OD combinations.")
+        if not origins.index.is_unique:
+            raise ValueError(
+                "The index of 'origins' must be unque when using a 'weight_df'."
+            )
+        if not destinations.index.is_unique:
+            raise ValueError(
+                "The index of 'destinations' must be unque when using a 'weight_df'."
+            )
+        # check if any/all indices are in origins/destinations.
+        # Doing 'any' to give better error message
+        level_0 = weight_df.index.get_level_values(0)
+        if not level_0.isin(origins.index).any():
+            raise ValueError("None of the 'origins' indices are in 'weight_df'.")
+        level_1 = weight_df.index.get_level_values(1)
+        if not level_1.isin(destinations.index).any():
+            raise ValueError("None of the 'destinations' indices are in 'weight_df'.")
+        if not level_0.isin(origins.index).all():
+            raise ValueError("Not all 'origins' indices are in 'weight_df'.")
+        if not level_1.isin(destinations.index).all():
+            raise ValueError("Not all 'destinations' indices are in 'weight_df'.")
+        return weight_df
     def _log_df_template(self, method: str, minutes_elapsed: float) -> DataFrame:
         """Creates a DataFrame with one row and the main columns.
@@ -1149,13 +1309,22 @@ class NetworkAnalysis:
         self.log = pd.concat([self.log, df], ignore_index=True)
-    def _prepare_network_analysis(self, origins, destinations=None) -> None:
+    def _prepare_network_analysis(
+        self, origins, destinations=None, rowwise=False
+    ) -> None:
         """Prepares the weight column, node ids, origins, destinations and graph.
         Updates the graph only if it is not yet created and no parts of the analysis
         has changed. this method is run inside od_cost_matrix, get_route and
         service_area.
         """
+        if rowwise and len(origins) != len(destinations):
+            raise ValueError(
+                "'origins' and 'destinations' must have the same length when "
+                "rowwise=True"
+            )
         self.network.gdf = self.rules._validate_weight(self.network.gdf)
         self.origins = Origins(origins)
@@ -1175,10 +1344,13 @@ class NetworkAnalysis:
         if not self._graph_is_up_to_date() or not self.network._nodes_are_up_to_date():
             self.network._update_nodes_if()
-            edges, weights = self._get_edges_and_weights()
+            edges, weights, ids = self._get_edges_and_weights()
             self.graph = self._make_graph(
-                edges=edges, weights=weights, directed=self.network._as_directed
+                edges=edges,
+                weights=weights,
+                edge_ids=ids,
+                directed=self.network._as_directed,
             )
             self._add_missing_vertices()
@@ -1186,7 +1358,9 @@ class NetworkAnalysis:
         self._update_wkts()
         self.rules._update_rules()
-    def _get_edges_and_weights(self) -> tuple[list[tuple[str, str]], list[float]]:
+    def _get_edges_and_weights(
+        self,
+    ) -> tuple[list[tuple[str, str]], list[float], list[str]]:
         """Creates lists of edges and weights which will be used to make the graph.
         Edges and weights between origins and nodes and nodes and destinations are
@@ -1203,15 +1377,14 @@ class NetworkAnalysis:
                     start=max(self.origins.gdf.temp_idx.astype(int)) + 1
                 )
-        edges = [
-            (str(source), str(target))
-            for source, target in zip(
-                self.network.gdf["source"], self.network.gdf["target"], strict=True
-            )
-        ]
+        edges: list[tuple[str, str]] = self.network.get_edges()
         weights = list(self.network.gdf[self.rules.weight])
+        self.network.gdf["source_target_weight"] = self.network._create_edge_ids(
+            edges, weights
+        )
         edges_start, weights_start = self.origins._get_edges_and_weights(
             nodes=self.network.nodes,
             rules=self.rules,
@@ -1221,7 +1394,8 @@ class NetworkAnalysis:
         weights = weights + weights_start
         if self.destinations is None:
-            return edges, weights
+            edge_ids = self.network._create_edge_ids(edges, weights)
+            return edges, weights, edge_ids
         edges_end, weights_end = self.destinations._get_edges_and_weights(
             nodes=self.network.nodes,
@@ -1231,7 +1405,9 @@ class NetworkAnalysis:
         edges = edges + edges_end
         weights = weights + weights_end
-        return edges, weights
+        edge_ids = self.network._create_edge_ids(edges, weights)
+        return edges, weights, edge_ids
     def _split_lines(self) -> None:
         if self.destinations is not None:
@@ -1304,6 +1480,7 @@ class NetworkAnalysis:
     def _make_graph(
         edges: list[tuple[str, ...]] | np.ndarray[tuple[str, ...]],
         weights: list[float] | np.ndarray[float],
+        edge_ids: np.ndarray,
         directed: bool,
     ) -> Graph:
         """Creates an igraph Graph from a list of edges and weights."""
@@ -1312,7 +1489,7 @@ class NetworkAnalysis:
         graph = igraph.Graph.TupleList(edges, directed=directed)
         graph.es["weight"] = weights
-        graph.es["source_target_weight"] = _edge_ids(edges, weights)
+        graph.es["source_target_weight"] = edge_ids
         graph.es["edge_tuples"] = edges
         graph.es["source"] = [edge[0] for edge in edges]
         graph.es["target"] = [edge[1] for edge in edges]
@@ -1339,6 +1516,7 @@ class NetworkAnalysis:
             if self._points_have_changed(self[points].gdf, what=points):
                 return False
+        #        if not self.gdf["source_target_weight"].
         return True
     def _points_have_changed(self, points: GeoDataFrame, what: str) -> bool:

ssb-sgis 0.1.5__py3-none-any.whl → 0.1.6__py3-none-any.whl

ssb-sgis 0.1.5py3-none-any.whl → 0.1.6py3-none-any.whl