PyPI - epyt-flow - Versions diffs - 0.1.0__py3-none-any.whl - Mend

epyt-flow 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (131) hide show

epyt_flow/EPANET/EPANET/SRC_engines/AUTHORS +28 -0
epyt_flow/EPANET/EPANET/SRC_engines/LICENSE +21 -0
epyt_flow/EPANET/EPANET/SRC_engines/Readme_SRC_Engines.txt +18 -0
epyt_flow/EPANET/EPANET/SRC_engines/enumstxt.h +134 -0
epyt_flow/EPANET/EPANET/SRC_engines/epanet.c +5578 -0
epyt_flow/EPANET/EPANET/SRC_engines/epanet2.c +865 -0
epyt_flow/EPANET/EPANET/SRC_engines/epanet2.def +131 -0
epyt_flow/EPANET/EPANET/SRC_engines/errors.dat +73 -0
epyt_flow/EPANET/EPANET/SRC_engines/funcs.h +193 -0
epyt_flow/EPANET/EPANET/SRC_engines/genmmd.c +1000 -0
epyt_flow/EPANET/EPANET/SRC_engines/hash.c +177 -0
epyt_flow/EPANET/EPANET/SRC_engines/hash.h +28 -0
epyt_flow/EPANET/EPANET/SRC_engines/hydcoeffs.c +1151 -0
epyt_flow/EPANET/EPANET/SRC_engines/hydraul.c +1117 -0
epyt_flow/EPANET/EPANET/SRC_engines/hydsolver.c +720 -0
epyt_flow/EPANET/EPANET/SRC_engines/hydstatus.c +476 -0
epyt_flow/EPANET/EPANET/SRC_engines/include/epanet2.h +431 -0
epyt_flow/EPANET/EPANET/SRC_engines/include/epanet2_2.h +1786 -0
epyt_flow/EPANET/EPANET/SRC_engines/include/epanet2_enums.h +468 -0
epyt_flow/EPANET/EPANET/SRC_engines/inpfile.c +810 -0
epyt_flow/EPANET/EPANET/SRC_engines/input1.c +707 -0
epyt_flow/EPANET/EPANET/SRC_engines/input2.c +864 -0
epyt_flow/EPANET/EPANET/SRC_engines/input3.c +2170 -0
epyt_flow/EPANET/EPANET/SRC_engines/main.c +93 -0
epyt_flow/EPANET/EPANET/SRC_engines/mempool.c +142 -0
epyt_flow/EPANET/EPANET/SRC_engines/mempool.h +24 -0
epyt_flow/EPANET/EPANET/SRC_engines/output.c +852 -0
epyt_flow/EPANET/EPANET/SRC_engines/project.c +1359 -0
epyt_flow/EPANET/EPANET/SRC_engines/quality.c +685 -0
epyt_flow/EPANET/EPANET/SRC_engines/qualreact.c +743 -0
epyt_flow/EPANET/EPANET/SRC_engines/qualroute.c +694 -0
epyt_flow/EPANET/EPANET/SRC_engines/report.c +1489 -0
epyt_flow/EPANET/EPANET/SRC_engines/rules.c +1362 -0
epyt_flow/EPANET/EPANET/SRC_engines/smatrix.c +871 -0
epyt_flow/EPANET/EPANET/SRC_engines/text.h +497 -0
epyt_flow/EPANET/EPANET/SRC_engines/types.h +874 -0
epyt_flow/EPANET/EPANET-MSX/MSX_Updates.txt +53 -0
epyt_flow/EPANET/EPANET-MSX/Src/dispersion.h +27 -0
epyt_flow/EPANET/EPANET-MSX/Src/hash.c +107 -0
epyt_flow/EPANET/EPANET-MSX/Src/hash.h +28 -0
epyt_flow/EPANET/EPANET-MSX/Src/include/epanetmsx.h +102 -0
epyt_flow/EPANET/EPANET-MSX/Src/include/epanetmsx_export.h +42 -0
epyt_flow/EPANET/EPANET-MSX/Src/mathexpr.c +937 -0
epyt_flow/EPANET/EPANET-MSX/Src/mathexpr.h +39 -0
epyt_flow/EPANET/EPANET-MSX/Src/mempool.c +204 -0
epyt_flow/EPANET/EPANET-MSX/Src/mempool.h +24 -0
epyt_flow/EPANET/EPANET-MSX/Src/msxchem.c +1285 -0
epyt_flow/EPANET/EPANET-MSX/Src/msxcompiler.c +368 -0
epyt_flow/EPANET/EPANET-MSX/Src/msxdict.h +42 -0
epyt_flow/EPANET/EPANET-MSX/Src/msxdispersion.c +586 -0
epyt_flow/EPANET/EPANET-MSX/Src/msxerr.c +116 -0
epyt_flow/EPANET/EPANET-MSX/Src/msxfile.c +260 -0
epyt_flow/EPANET/EPANET-MSX/Src/msxfuncs.c +175 -0
epyt_flow/EPANET/EPANET-MSX/Src/msxfuncs.h +35 -0
epyt_flow/EPANET/EPANET-MSX/Src/msxinp.c +1504 -0
epyt_flow/EPANET/EPANET-MSX/Src/msxout.c +401 -0
epyt_flow/EPANET/EPANET-MSX/Src/msxproj.c +791 -0
epyt_flow/EPANET/EPANET-MSX/Src/msxqual.c +2010 -0
epyt_flow/EPANET/EPANET-MSX/Src/msxrpt.c +400 -0
epyt_flow/EPANET/EPANET-MSX/Src/msxtank.c +422 -0
epyt_flow/EPANET/EPANET-MSX/Src/msxtoolkit.c +1164 -0
epyt_flow/EPANET/EPANET-MSX/Src/msxtypes.h +551 -0
epyt_flow/EPANET/EPANET-MSX/Src/msxutils.c +524 -0
epyt_flow/EPANET/EPANET-MSX/Src/msxutils.h +56 -0
epyt_flow/EPANET/EPANET-MSX/Src/newton.c +158 -0
epyt_flow/EPANET/EPANET-MSX/Src/newton.h +34 -0
epyt_flow/EPANET/EPANET-MSX/Src/rk5.c +287 -0
epyt_flow/EPANET/EPANET-MSX/Src/rk5.h +39 -0
epyt_flow/EPANET/EPANET-MSX/Src/ros2.c +293 -0
epyt_flow/EPANET/EPANET-MSX/Src/ros2.h +35 -0
epyt_flow/EPANET/EPANET-MSX/Src/smatrix.c +816 -0
epyt_flow/EPANET/EPANET-MSX/Src/smatrix.h +29 -0
epyt_flow/EPANET/EPANET-MSX/readme.txt +14 -0
epyt_flow/EPANET/compile.sh +4 -0
epyt_flow/VERSION +1 -0
epyt_flow/__init__.py +24 -0
epyt_flow/data/__init__.py +0 -0
epyt_flow/data/benchmarks/__init__.py +11 -0
epyt_flow/data/benchmarks/batadal.py +257 -0
epyt_flow/data/benchmarks/batadal_data.py +28 -0
epyt_flow/data/benchmarks/battledim.py +473 -0
epyt_flow/data/benchmarks/battledim_data.py +51 -0
epyt_flow/data/benchmarks/gecco_water_quality.py +267 -0
epyt_flow/data/benchmarks/leakdb.py +592 -0
epyt_flow/data/benchmarks/leakdb_data.py +18923 -0
epyt_flow/data/benchmarks/water_usage.py +123 -0
epyt_flow/data/networks.py +650 -0
epyt_flow/gym/__init__.py +4 -0
epyt_flow/gym/control_gyms.py +47 -0
epyt_flow/gym/scenario_control_env.py +101 -0
epyt_flow/metrics.py +404 -0
epyt_flow/models/__init__.py +2 -0
epyt_flow/models/event_detector.py +31 -0
epyt_flow/models/sensor_interpolation_detector.py +118 -0
epyt_flow/rest_api/__init__.py +4 -0
epyt_flow/rest_api/base_handler.py +70 -0
epyt_flow/rest_api/res_manager.py +95 -0
epyt_flow/rest_api/scada_data_handler.py +476 -0
epyt_flow/rest_api/scenario_handler.py +352 -0
epyt_flow/rest_api/server.py +106 -0
epyt_flow/serialization.py +438 -0
epyt_flow/simulation/__init__.py +5 -0
epyt_flow/simulation/events/__init__.py +6 -0
epyt_flow/simulation/events/actuator_events.py +259 -0
epyt_flow/simulation/events/event.py +81 -0
epyt_flow/simulation/events/leakages.py +404 -0
epyt_flow/simulation/events/sensor_faults.py +267 -0
epyt_flow/simulation/events/sensor_reading_attack.py +185 -0
epyt_flow/simulation/events/sensor_reading_event.py +170 -0
epyt_flow/simulation/events/system_event.py +88 -0
epyt_flow/simulation/parallel_simulation.py +147 -0
epyt_flow/simulation/scada/__init__.py +3 -0
epyt_flow/simulation/scada/advanced_control.py +134 -0
epyt_flow/simulation/scada/scada_data.py +1589 -0
epyt_flow/simulation/scada/scada_data_export.py +255 -0
epyt_flow/simulation/scenario_config.py +608 -0
epyt_flow/simulation/scenario_simulator.py +1897 -0
epyt_flow/simulation/scenario_visualizer.py +61 -0
epyt_flow/simulation/sensor_config.py +1289 -0
epyt_flow/topology.py +290 -0
epyt_flow/uncertainty/__init__.py +3 -0
epyt_flow/uncertainty/model_uncertainty.py +302 -0
epyt_flow/uncertainty/sensor_noise.py +73 -0
epyt_flow/uncertainty/uncertainties.py +555 -0
epyt_flow/uncertainty/utils.py +206 -0
epyt_flow/utils.py +306 -0
epyt_flow-0.1.0.dist-info/LICENSE +21 -0
epyt_flow-0.1.0.dist-info/METADATA +139 -0
epyt_flow-0.1.0.dist-info/RECORD +131 -0
epyt_flow-0.1.0.dist-info/WHEEL +5 -0
epyt_flow-0.1.0.dist-info/top_level.txt +1 -0

epyt_flow/data/benchmarks/battledim.py ADDED Viewed

@@ -0,0 +1,473 @@
+"""
+The Battle of the Leakage Detection and Isolation Methods (*BattLeDIM*) 2020, organized by
+S. G. Vrachimis, D. G. Eliades, R. Taormina, Z. Kapelan, A. Ostfeld, S. Liu, M. Kyriakou,
+P. Pavlou, M. Qiu, and M. M. Polycarpou, as part of the 2nd International CCWI/WDSA Joint
+Conference in Beijing, China, aims at objectively comparing the performance of methods for
+the detection and localization of leakage events, relying on SCADA measurements of flow and
+pressure sensors installed within water distribution networks.
+See https://github.com/KIOS-Research/BattLeDIM for details.
+This module provides functions for loading the original BattLeDIM data set
+:func:`~epyt_flow.data.benchmarks.battledim.load_data`, as well as methods for loading the scenarios
+:func:`~epyt_flow.data.benchmarks.battledim.load_scenario` and pre-generated SCADA data
+:func:`~epyt_flow.data.benchmarks.battledim.load_scada_data`.
+The official scoring/evaluation is implemented in
+:func:`~epyt_flow.data.benchmarks.battledim.compute_evaluation_score` -- i.e. those results can be
+directly compared to the official leaderboard results.
+Besides this, the user can choose to evaluate predictions using any other metric from
+:mod:`~epyt_flow.metrics`.
+"""
+from typing import Any, Union
+import os
+import math
+from datetime import datetime
+import functools
+import scipy
+import pandas as pd
+import numpy as np
+from scipy.sparse import bsr_array
+from .battledim_data import START_TIME_TEST, START_TIME_TRAIN, LEAKS_CONFIG_TEST, \
+    LEAKS_CONFIG_TRAIN
+from ..networks import load_ltown
+from ...simulation.events import AbruptLeakage, IncipientLeakage, Leakage
+from ...simulation import ScenarioConfig
+from ...topology import NetworkTopology
+from ...simulation.scada import ScadaData
+from ...utils import get_temp_folder, to_seconds, create_path_if_not_exist, download_if_necessary
+def __parse_leak_config(start_time: str, leaks_config: str) -> list[Leakage]:
+    leakages = []
+    for leak in leaks_config.splitlines():
+        # Parse entry
+        items = [i.strip() for i in leak.split(",")]
+        leaky_pipe_id = items[0]
+        leak_start_time = int((datetime.strptime(items[1], "%Y-%m-%d %H:%M") - start_time)
+                              .total_seconds())
+        leak_end_time = int((datetime.strptime(items[2], "%Y-%m-%d %H:%M") - start_time)
+                            .total_seconds())
+        leak_diameter = float(items[3])
+        leak_type = items[4]
+        leak_peak_time = int((datetime.strptime(items[5], "%Y-%m-%d %H:%M") - start_time)
+                             .total_seconds())
+        # Create leak config
+        if leak_type == "incipient":
+            leak = IncipientLeakage(link_id=leaky_pipe_id, diameter=leak_diameter,
+                                    start_time=leak_start_time, end_time=leak_end_time,
+                                    peak_time=leak_peak_time)
+        elif leak_type == "abrupt":
+            leak = AbruptLeakage(link_id=leaky_pipe_id, diameter=leak_diameter,
+                                 start_time=leak_start_time, end_time=leak_end_time)
+        leakages.append(leak)
+    return leakages
+def __create_labels(n_time_steps: int, return_test_scenario: bool,
+                    links: list[str]) -> tuple[np.ndarray, scipy.sparse.bsr_array]:
+    y = np.zeros(n_time_steps)
+    start_time = START_TIME_TEST if return_test_scenario is True else START_TIME_TRAIN
+    leaks_config = LEAKS_CONFIG_TEST if return_test_scenario is True else LEAKS_CONFIG_TRAIN
+    leakages = __parse_leak_config(start_time, leaks_config)
+    def leak_time_to_idx(t: int, round_up: bool = False):
+        if round_up is False:
+            return math.floor(t / 300)
+        else:
+            return math.ceil(t / 300)
+    leak_locations_row = []
+    leak_locations_col = []
+    for leak in leakages:
+        t_idx_start = leak_time_to_idx(leak.start_time)
+        t_idx_end = leak_time_to_idx(leak.end_time, round_up=True)
+        y[t_idx_start:t_idx_end] = 1
+        leak_link_idx = links.index(leak.link_id)
+        for t in range(t_idx_end - t_idx_start):
+            leak_locations_row.append(t_idx_start + t)
+            leak_locations_col.append(leak_link_idx)
+    y_leak_locations = bsr_array(
+        (np.ones(len(leak_locations_row)), (leak_locations_row, leak_locations_col)),
+        shape=(n_time_steps, len(links)))
+    return y, y_leak_locations
+def compute_evaluation_score(y_leak_locations_pred: list[tuple[str, int]],
+                             test_scenario: bool, verbose: bool = True) -> dict:
+    """
+    Evaluates the predictions (i.e. start time and location of leakages) as it was done in the
+    BattLeDIM competition -- i.e. the output of this function can be directly compared
+    to the official leaderboard results.
+    The L-Town topology and (for the test scenario only) one leak demand file per leakage
+    are fetched into the temp folder by means of `download_if_necessary`.
+    Parameters
+    ----------
+    y_leak_locations_pred : `list[tuple[str, int]]`
+        Predictions of location (link/pipe ID) and start time
+        (in seconds since simulation start) of leakages.
+    test_scenario : `bool`
+        True if the given predictions are made for the test scenario, False otherwise.
+    verbose : `bool`, optional
+        Passed on to the file download -- if True, a progress bar is shown while
+        downloading files.
+        The default is True.
+    Returns
+    -------
+    `dict`
+        Dictionary with the keys "true_positive_rate", "true_positives", "false_positives",
+        "false_negatives", and "total_savings" (total monetary savings in Euro --
+        None if `test_scenario` is not True).
+    """
+    # Original MATLAB implementation:
+    # https://github.com/KIOS-Research/BattLeDIM/blob/master/Scoring%20Algorithm/Scoring_Algorithm.m
+    # Scoring parameters
+    dist_max = 300      # Max pipe distance for leakage detection (meters)
+    cost_water = .8     # Cost of water per m3 (Euro)
+    cost_crew = 500     # Max repair crew cost per assignment (Euro)
+    hydraulic_time_step = to_seconds(minutes=5)
+    # Get WDN topology and find minimum topological distance (using the pipe lengths)
+    # between all nodes
+    f_topology_in = os.path.join(get_temp_folder(), "BattLeDIM", "ltown.epytflow_topology")
+    url_topology = "https://filedn.com/lumBFq2P9S74PNoLPWtzxG4/EPyT-Flow/BattLeDIM/" +\
+        "ltown.epytflow_topology"
+    download_if_necessary(f_topology_in, url_topology, verbose)
+    topology = NetworkTopology.load_from_file(f_topology_in)
+    all_pairs_shortest_path_length = topology.get_all_pairs_shortest_path_length()
+    # Load ground truth
+    sim_start_time = START_TIME_TEST if test_scenario is True else START_TIME_TRAIN
+    leaks_config = LEAKS_CONFIG_TEST if test_scenario is True else LEAKS_CONFIG_TRAIN
+    leakages = __parse_leak_config(sim_start_time, leaks_config)
+    n_leakages = len(leakages)
+    # Leak demand time series per leaky pipe -- stays empty for the training scenario,
+    # in which case no water savings are credited below
+    leak_demands = {}
+    if test_scenario is True:
+        # Download leak demands
+        for leak in leakages:
+            f_in = f"Leak_{leak.link_id}.xlsx"
+            url = "https://raw.githubusercontent.com/KIOS-Research/BattLeDIM/master/" + \
+                f"Scoring%20Algorithm/competition_leakages/{f_in}"
+            f_local_in = os.path.join(get_temp_folder(), "BattLeDIM", f_in)
+            download_if_necessary(f_local_in, url, verbose)
+            df_leak_demand = pd.read_excel(f_local_in, sheet_name="Demand (m3_h)")
+            leak_demand = df_leak_demand[leak.link_id].to_numpy()
+            leak_demands[leak.link_id] = leak_demand
+    # Evaluate given predictions/alarms
+    total_savings = 0
+    true_positives = 0
+    false_positives = 0
+    detected_leaks = []
+    # Ground truth as (pipe ID, start time, end time) tuples -- times in seconds since
+    # simulation start
+    leak_data = []
+    for leak in leakages:
+        leak_data.append((leak.link_id, leak.start_time, leak.end_time))
+    def __find_closest_leaky_pipe(link_id) -> tuple[str, float, int, int]:
+        # Returns ID, distance, start time, and end time of the leaky pipe that is closest
+        # to the given link. The distance to a leaky pipe is the smallest shortest-path
+        # length between any end node of the given link and any end node of the leaky pipe,
+        # plus half of the length of the leaky pipe.
+        closest_leaky_pipe_id = None
+        closest_dist = float("inf")
+        closest_start_time = None
+        closest_end_time = None
+        node_a, node_b = topology.get_link_info(link_id)["nodes"]
+        for leak_pipe_id, start_time_leak, end_time_leak in leak_data:
+            link_info = topology.get_link_info(leak_pipe_id)
+            end_node_a, end_node_b = link_info["nodes"]
+            link_length = link_info["length"]
+            dists = []
+            dists.append(all_pairs_shortest_path_length[node_a][end_node_a] + .5 * link_length)
+            dists.append(all_pairs_shortest_path_length[node_a][end_node_b] + .5 * link_length)
+            dists.append(all_pairs_shortest_path_length[node_b][end_node_a] + .5 * link_length)
+            dists.append(all_pairs_shortest_path_length[node_b][end_node_b] + .5 * link_length)
+            if min(dists) < closest_dist:
+                closest_dist = min(dists)
+                closest_leaky_pipe_id = leak_pipe_id
+                closest_start_time = start_time_leak
+                closest_end_time = end_time_leak
+        return closest_leaky_pipe_id, closest_dist, closest_start_time, closest_end_time
+    for pipe_id, start_time in y_leak_locations_pred:
+        # Check if leakages was found and if so, how far away it is from the ground truth
+        leaky_pipe_dist = None
+        leaky_pipe = None
+        # Exact hit: the alarm names a leaky pipe, falls into the time window of that
+        # leakage, and this pipe has not been credited before
+        if any(pipe_id == leaky_pipe_id and start_time >= start_time_leak and
+               start_time <= end_time_leak and
+               pipe_id not in detected_leaks
+               for leaky_pipe_id, start_time_leak, end_time_leak in leak_data):
+            leaky_pipe_dist = 0
+            leaky_pipe = pipe_id
+        else:
+            # Otherwise the alarm is matched to the closest leaky pipe if the alarm falls
+            # into the time window of that leakage.
+            # NOTE(review): neither `dist` is compared against `dist_max` nor is
+            # `detected_leaks` consulted in this branch -- far away or repeated alarms are
+            # counted as true positives as well. Confirm against the MATLAB reference.
+            closest_leaky_pipe_id, dist, start_time_leak, end_time_leak = \
+                __find_closest_leaky_pipe(pipe_id)
+            if start_time >= start_time_leak and start_time <= end_time_leak:
+                leaky_pipe_dist = dist
+                leaky_pipe = closest_leaky_pipe_id
+        # Compute score of current alarm
+        if leaky_pipe is not None:
+            detected_leaks.append(leaky_pipe)
+            true_positives += 1
+            water_saved = 0
+            if leaky_pipe in leak_demands:
+                # Sum of the leak demand from the first time step at or after the alarm
+                leak_demand = leak_demands[leaky_pipe]
+                start_time_idx = math.ceil(start_time / hydraulic_time_step)
+                water_saved = np.sum(leak_demand[start_time_idx:])
+            # Value of the saved water minus crew costs, which scale with the distance
+            # between the alarm and the leaky pipe
+            total_savings += water_saved * cost_water - (leaky_pipe_dist / dist_max) * cost_crew
+        else:
+            # A false alarm costs one full crew assignment
+            false_positives += 1
+            total_savings += -1. * cost_crew
+    # Compute final scores
+    false_negatives = n_leakages - true_positives
+    # The denominator is equal to the number of ground truth leakages
+    true_positive_rate = true_positives / (true_positives + false_negatives)
+    return {"true_positive_rate": true_positive_rate, "true_positives": true_positives,
+            "false_positives": false_positives, "false_negatives": false_negatives,
+            "total_savings": total_savings if test_scenario is True else None}
+def load_data(return_test_scenario: bool, download_dir: str = None, return_X_y: bool = False,
+              return_features_desc: bool = False, return_leak_locations: bool = False,
+              verbose: bool = True) -> Union[pd.DataFrame, Any]:
+    """
+    Loads the original BattLeDIM benchmark data set.
+    Note that the data set exists in two different version --
+    a training version and an evaluation/test version.
+    Parameters
+    ----------
+    return_test_scenario : `bool`
+        If True, the evaluation/test data set is returned, otherwise the historical
+        (i.e. training) data set is returned.
+    download_dir : `str`, optional
+        Path to the data files -- if None, the temp folder will be used.
+        If the path does not exist, the data files will be downloaded to the given path.
+        The default is None.
+    return_X_y : `bool`, optional
+        If True, the data is returned together with the labels (presence of a leakage) as
+        two Numpy arrays, otherwise, the data is returned as a
+        :class:`~epyt_flow.simulation.scada.scada_data.ScadaData` instance.
+        The default is False.
+    return_features_desc : `bool`, optional
+        If True and if `return_X_y` is True, the returned dictionary contains the
+        features' descriptions (i.e. names) under the key "features_desc".
+        The default is False.
+    return_leak_locations : `bool`
+        If True, the leak locations are returned as well --
+        as an instance of `scipy.sparse.bsr_array`.
+        The default is False.
+    verbose : `bool`, optional
+        If True, a progress bar is shown while downloading files.
+        The default is True.
+    Returns
+    -------
+    Either a `pandas.DataFrame` instance or a tuple of Numpy arrays.
+        Benchmark data set.
+    """
+    # Download data files if necessary
+    if return_test_scenario is True:
+        url_data = "https://zenodo.org/records/4017659/files/2018_SCADA.xlsx?download=1"
+        f_in = "2018_SCADA.xlsx"
+    else:
+        url_data = "https://zenodo.org/records/4017659/files/2019_SCADA.xlsx?download=1"
+        f_in = "2019_SCADA.xlsx"
+    download_dir = download_dir if download_dir is not None else get_temp_folder()
+    download_dir = os.path.join(download_dir, "BattLeDIM")
+    create_path_if_not_exist(download_dir)
+    f_in = os.path.join(download_dir, f_in)
+    download_if_necessary(f_in, url_data, verbose)
+    # Load and parse data files
+    df_pressures = pd.read_excel(f_in, sheet_name="Pressures (m)")
+    df_pressures.columns = ["Timestamp"] + [f"Pressure_{n_id}" for n_id in df_pressures.columns[1:]]
+    df_demands = pd.read_excel(f_in, sheet_name="Demands (L_h)")
+    df_demands.columns = ["Timestamp"] + [f"Demand_{n_id}" for n_id in df_demands.columns[1:]]
+    df_flows = pd.read_excel(f_in, sheet_name="Flows (m3_h)")
+    df_flows.columns = ["Timestamp"] + [f"Flow_{l_id}" for l_id in df_flows.columns[1:]]
+    df_levels = pd.read_excel(f_in, sheet_name="Levels (m)")
+    df_levels.columns = ["Timestamp"] + [f"Level_{t_id}" for t_id in df_levels.columns[1:]]
+    df_final = functools.reduce(lambda left, right: pd.merge(left, right, on="Timestamp"),
+                                [df_pressures, df_flows, df_levels, df_demands])
+    # Prepare and return final data
+    if return_X_y is True:
+        features_desc = list(df_final.columns)
+        features_desc.remove("Timestamp")
+        network_config = load_ltown(download_dir)
+        links = network_config.sensor_config.links
+        X = df_final[features_desc].to_numpy()
+        y, y_leak_locations = __create_labels(X.shape[0], return_test_scenario, links)
+        if return_features_desc is True:
+            if return_leak_locations is True:
+                return X, y, features_desc, y_leak_locations
+            else:
+                return X, y, features_desc
+        else:
+            if return_leak_locations is True:
+                return X, y, y_leak_locations
+            else:
+                return X, y
+    else:
+        return df_final
+def load_scada_data(return_test_scenario: bool, download_dir: str = None,
+                    return_X_y: bool = False, return_leak_locations: bool = False,
+                    verbose: bool = True) -> list[Union[ScadaData, Any]]:
+    """
+    Loads the SCADA data of the simulated BattLeDIM benchmark scenario -- note that due to
+    randomness, these differ from the original data set which can be loaded by calling
+    :func:`~epyt_flow.data.benchmarks.battledim.load_data`.
+    .. warning::
+        A large file (approx. 4GB) will be downloaded and loaded into memory --
+        this might take some time.
+    Parameters
+    ----------
+    return_test_scenario : `bool`
+        If True, the evaluation/test scenario is returned, otherwise the historical
+        (i.e. training) scenario is returned.
+    download_dir : `str`, optional
+        Path to the data files -- if None, the temp folder will be used.
+        If the path does not exist, the data files will be downloaded to the given path.
+        The default is None.
+    return_X_y : `bool`, optional
+        If True, the data is returned together with the labels (presence of a leakage) as
+        two Numpy arrays, otherwise, the data is returned as a
+        :class:`~epyt_flow.simulation.scada.scada_data.ScadaData` instance.
+        The default is False.
+    return_leak_locations : `bool`
+        If True, the leak locations are returned as well --
+        as an instance of `scipy.sparse.bsr_array`.
+        The default is False.
+    verbose : `bool`, optional
+        If True, a progress bar is shown while downloading files.
+        The default is True.
+    Returns
+    -------
+    :class:`~epyt_flow.simulation.scada.scada_data.ScadaData` or `list[tuple[numpy.ndarray, numpy.ndarray]]`
+        The simulated benchmark scenario as either a
+        :class:`~epyt_flow.simulation.scada.scada_data.ScadaData` instance or as a tuple of
+        (X, y) Numpy arrays. If 'return_leak_locations' is True, the leak locations are included
+        as an instance of `scipy.sparse.bsr_array` as well.
+    """
+    download_dir = download_dir if download_dir is not None else get_temp_folder()
+    url_data = "https://filedn.com/lumBFq2P9S74PNoLPWtzxG4/EPyT-Flow/BattLeDIM/"
+    f_in = f"{'battledim_test' if return_test_scenario else 'battledim_train'}.epytflow_scada_data"
+    download_if_necessary(os.path.join(download_dir, f_in), url_data + f_in, verbose)
+    data = ScadaData.load_from_file(os.path.join(download_dir, f_in))
+    X = data.get_data()
+    y, y_leak_locations = __create_labels(X.shape[0], return_test_scenario,
+                                          data.sensor_config.links)
+    if return_X_y is True:
+        if return_leak_locations is True:
+            return X, y, y_leak_locations
+        else:
+            return X, y
+    else:
+        if return_leak_locations is True:
+            return data, y_leak_locations
+        else:
+            return data
+def load_scenario(return_test_scenario: bool, download_dir: str = None,
+                  verbose: bool = True) -> ScenarioConfig:
+    """
+    Creates and returns the BattLeDIM scenario -- it can be either modified or
+    passed directly to the simulator
+    :class:`~epyt_flow.simulation.scenario_simulator.ScenarioSimulator`.
+    .. note::
+        Note that due to randomness, the simulation results differ from the original data set which
+        can be loaded by calling :func:`~epyt_flow.data.benchmarks.battledim.load_data`.
+    Parameters
+    ----------
+    return_test_scenario : `bool`
+        If True, the evaluation/test scenario is returned, otherwise the historical
+        (i.e. training) scenario is returned.
+    download_dir : `str`, optional
+        Path to the L-TOWN.inp file -- if None, the temp folder will be used.
+        If the path does not exist, the .inp will be downloaded to the given path.
+        The default is None.
+    verbose : `bool`, optional
+        If True, a progress bar is shown while downloading files.
+        The default is True.
+    Returns
+    -------
+    :class:`~epyt_flow.simulation.scenario_config.ScenarioConfig`
+        Complete scenario configuration of the BattLeDIM benchmark scenario.
+    """
+    # Load L-Town network including the sensor placement
+    if download_dir is not None:
+        ltown_config = load_ltown(download_dir=download_dir, use_realistic_demands=True,
+                                  include_default_sensor_placement=True, verbose=verbose)
+    else:
+        ltown_config = load_ltown(use_realistic_demands=True, include_default_sensor_placement=True,
+                                  verbose=verbose)
+    # Set simulation duration
+    general_params = {"simulation_duration": to_seconds(days=365),    # One year
+                      "hydraulic_time_step": to_seconds(minutes=5),   # 5min time steps
+                      "reporting_time_step": to_seconds(minutes=5)} | ltown_config.general_params
+    # Add events
+    start_time = START_TIME_TEST if return_test_scenario is True else START_TIME_TRAIN
+    leaks_config = LEAKS_CONFIG_TEST if return_test_scenario is True else LEAKS_CONFIG_TRAIN
+    leakages = __parse_leak_config(start_time, leaks_config)
+    # Build final scenario
+    return ScenarioConfig(f_inp_in=ltown_config.f_inp_in, general_params=general_params,
+                          sensor_config=ltown_config.sensor_config, system_events=leakages)

epyt_flow/data/benchmarks/battledim_data.py ADDED Viewed

@@ -0,0 +1,51 @@
+"""
+Module provides the leakage configurations for BattLeDIM --
+i.e. the simulation start times and the leakages of the training (2018) and the
+test (2019) scenario.
+"""
+from datetime import datetime
+# Start of the training scenario -- leak times are converted relative to this point in time
+START_TIME_TRAIN = datetime.strptime("2018-01-01 00:00", "%Y-%m-%d %H:%M")
+# Leakages of the training scenario -- one leakage per line, comma-separated fields:
+# pipe ID, start time, end time, leak diameter, leak type (incipient/abrupt), peak time.
+# Times are formatted as "%Y-%m-%d %H:%M"; for abrupt leakages the peak time is equal
+# to the start time.
+# NOTE(review): the unit of the leak diameter is presumably meters -- confirm.
+# The leading white spaces of the continuation lines are part of the string --
+# the fields must be stripped when parsing.
+LEAKS_CONFIG_TRAIN = \
+    """p257, 2018-01-08 13:30, 2018-12-31 23:55, 0.011843, incipient, 2018-01-25 08:30
+    p461, 2018-01-23 04:25, 2018-04-02 11:40, 0.021320, incipient, 2018-03-27 20:35
+    p232, 2018-01-31 02:35, 2018-02-10 09:20, 0.020108, incipient, 2018-02-03 16:05
+    p427, 2018-02-13 08:25, 2018-12-31 23:55, 0.0090731, incipient, 2018-05-14 19:25
+    p673, 2018-03-05 15:45, 2018-03-23 10:25, 0.022916, abrupt, 2018-03-05 15:45
+    p810, 2018-07-28 03:05, 2018-12-31 23:55, 0.010028, incipient, 2018-11-02 22:25
+    p628, 2018-05-02 14:55, 2018-05-29 21:20, 0.022318, incipient, 2018-05-16 08:00
+    p538, 2018-05-18 08:35, 2018-06-02 06:05, 0.021731, abrupt, 2018-05-18 08:35
+    p866, 2018-06-01 09:05, 2018-06-12 03:00, 0.018108, abrupt, 2018-06-01 09:05
+    p31, 2018-06-28 10:35, 2018-08-12 17:30, 0.016389, incipient, 2018-08-03 02:45
+    p654, 2018-07-05 03:40, 2018-12-31 23:55, 0.0087735, incipient, 2018-09-16 21:05
+    p183, 2018-08-07 02:35, 2018-09-01 17:10, 0.015853, abrupt, 2018-08-07 02:35
+    p158, 2018-10-06 02:35, 2018-10-23 13:35, 0.019364, abrupt, 2018-10-06 02:35
+    p369, 2018-10-26 02:05, 2018-11-08 20:25, 0.019363, abrupt, 2018-10-26 02:05"""
+# Start of the test scenario -- leak times are converted relative to this point in time
+START_TIME_TEST = datetime.strptime("2019-01-01 00:00", "%Y-%m-%d %H:%M")
+# Leakages of the test scenario -- same line format as LEAKS_CONFIG_TRAIN.
+# The first four entries (p257, p427, p810, p654) are the training leakages that last
+# until the end of 2018; here they are active for the entire year.
+LEAKS_CONFIG_TEST = \
+    """p257, 2019-01-01 00:00, 2019-12-31 23:55, 0.011843, incipient, 2019-01-01 00:00
+    p427, 2019-01-01 00:00, 2019-12-31 23:55, 0.0090731, incipient, 2019-01-01 00:00
+    p810, 2019-01-01 00:00, 2019-12-31 23:55, 0.010028, incipient, 2019-01-01 00:00
+    p654, 2019-01-01 00:00, 2019-12-31 23:55, 0.0087735, incipient, 2019-01-01 00:00
+    p523, 2019-01-15 23:00, 2019-02-01 09:50, 0.020246, abrupt, 2019-01-15 23:00
+    p827, 2019-01-24 18:30, 2019-02-07 09:05, 0.02025, abrupt, 2019-01-24 18:30
+    p280, 2019-02-10 13:05, 2019-12-31 23:55, 0.0095008, abrupt, 2019-02-10 13:05
+    p653, 2019-03-03 13:10, 2019-05-05 12:10, 0.016035, incipient, 2019-04-21 19:00
+    p710, 2019-03-24 14:15, 2019-12-31 23:55, 0.0092936, abrupt, 2019-03-24 14:15
+    p514, 2019-04-02 20:40, 2019-05-23 14:55, 0.014979, abrupt, 2019-04-02 20:40
+    p331, 2019-04-20 10:10, 2019-12-31 23:55, 0.014053, abrupt, 2019-04-20 10:10
+    p193, 2019-05-19 10:40, 2019-12-31 23:55, 0.01239, incipient, 2019-07-25 03:20
+    p277, 2019-05-30 21:55, 2019-12-31 23:55, 0.012089, incipient, 2019-08-11 15:05
+    p142, 2019-06-12 19:55, 2019-07-17 09:25, 0.019857, abrupt, 2019-06-12 19:55
+    p680, 2019-07-10 08:45, 2019-12-31 23:55, 0.0097197, abrupt, 2019-07-10 08:45
+    p586, 2019-07-26 14:40, 2019-09-16 03:20, 0.017184, incipient, 2019-08-28 07:55
+    p721, 2019-08-02 03:00, 2019-12-31 23:55, 0.01408, incipient, 2019-09-23 05:40
+    p800, 2019-08-16 14:00, 2019-10-01 16:35, 0.018847, incipient, 2019-09-07 21:05
+    p123, 2019-09-13 20:05, 2019-12-31 23:55, 0.011906, incipient, 2019-11-29 22:10
+    p455, 2019-10-03 14:00, 2019-12-31 23:55, 0.012722, incipient, 2019-12-16 05:25
+    p762, 2019-10-09 10:15, 2019-12-31 23:55, 0.01519, incipient, 2019-12-03 01:15
+    p426, 2019-10-25 13:25, 2019-12-31 23:55, 0.015008, abrupt, 2019-10-25 13:25
+    p879, 2019-11-20 11:55, 2019-12-31 23:55, 0.013195, incipient, 2019-12-31 23:55"""