openstef-3.4.56-py3-none-any.whl → openstef-4.0.0a3-py3-none-any.whl

This diff compares the contents of two publicly released package versions, as published to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.
Files changed (104)
  1. openstef-4.0.0a3.dist-info/METADATA +177 -0
  2. openstef-4.0.0a3.dist-info/RECORD +4 -0
  3. {openstef-3.4.56.dist-info → openstef-4.0.0a3.dist-info}/WHEEL +1 -2
  4. openstef/__init__.py +0 -14
  5. openstef/__main__.py +0 -3
  6. openstef/app_settings.py +0 -19
  7. openstef/data/NL_terrestrial_radiation.csv +0 -25585
  8. openstef/data/NL_terrestrial_radiation.csv.license +0 -3
  9. openstef/data/dazls_model_3.4.24/dazls_stored_3.4.24_baseline_model.z +0 -0
  10. openstef/data/dazls_model_3.4.24/dazls_stored_3.4.24_baseline_model.z.license +0 -3
  11. openstef/data/dazls_model_3.4.24/dazls_stored_3.4.24_model_card.md +0 -18
  12. openstef/data/dazls_model_3.4.24/dazls_stored_3.4.24_model_card.md.license +0 -3
  13. openstef/data/dutch_holidays.csv +0 -1759
  14. openstef/data/dutch_holidays.csv.license +0 -3
  15. openstef/data/pv_single_coefs.csv +0 -601
  16. openstef/data/pv_single_coefs.csv.license +0 -3
  17. openstef/data_classes/__init__.py +0 -3
  18. openstef/data_classes/data_prep.py +0 -99
  19. openstef/data_classes/model_specifications.py +0 -30
  20. openstef/data_classes/prediction_job.py +0 -135
  21. openstef/data_classes/split_function.py +0 -97
  22. openstef/enums.py +0 -140
  23. openstef/exceptions.py +0 -74
  24. openstef/feature_engineering/__init__.py +0 -3
  25. openstef/feature_engineering/apply_features.py +0 -138
  26. openstef/feature_engineering/bidding_zone_to_country_mapping.py +0 -106
  27. openstef/feature_engineering/cyclic_features.py +0 -161
  28. openstef/feature_engineering/data_preparation.py +0 -152
  29. openstef/feature_engineering/feature_adder.py +0 -206
  30. openstef/feature_engineering/feature_applicator.py +0 -202
  31. openstef/feature_engineering/general.py +0 -141
  32. openstef/feature_engineering/holiday_features.py +0 -231
  33. openstef/feature_engineering/lag_features.py +0 -165
  34. openstef/feature_engineering/missing_values_transformer.py +0 -141
  35. openstef/feature_engineering/rolling_features.py +0 -58
  36. openstef/feature_engineering/weather_features.py +0 -492
  37. openstef/metrics/__init__.py +0 -3
  38. openstef/metrics/figure.py +0 -303
  39. openstef/metrics/metrics.py +0 -486
  40. openstef/metrics/reporter.py +0 -222
  41. openstef/model/__init__.py +0 -3
  42. openstef/model/basecase.py +0 -82
  43. openstef/model/confidence_interval_applicator.py +0 -242
  44. openstef/model/fallback.py +0 -77
  45. openstef/model/metamodels/__init__.py +0 -3
  46. openstef/model/metamodels/feature_clipper.py +0 -90
  47. openstef/model/metamodels/grouped_regressor.py +0 -222
  48. openstef/model/metamodels/missing_values_handler.py +0 -138
  49. openstef/model/model_creator.py +0 -214
  50. openstef/model/objective.py +0 -426
  51. openstef/model/objective_creator.py +0 -65
  52. openstef/model/regressors/__init__.py +0 -3
  53. openstef/model/regressors/arima.py +0 -197
  54. openstef/model/regressors/custom_regressor.py +0 -64
  55. openstef/model/regressors/dazls.py +0 -116
  56. openstef/model/regressors/flatliner.py +0 -95
  57. openstef/model/regressors/gblinear_quantile.py +0 -334
  58. openstef/model/regressors/lgbm.py +0 -29
  59. openstef/model/regressors/linear.py +0 -90
  60. openstef/model/regressors/linear_quantile.py +0 -305
  61. openstef/model/regressors/regressor.py +0 -114
  62. openstef/model/regressors/xgb.py +0 -52
  63. openstef/model/regressors/xgb_multioutput_quantile.py +0 -261
  64. openstef/model/regressors/xgb_quantile.py +0 -228
  65. openstef/model/serializer.py +0 -431
  66. openstef/model/standard_deviation_generator.py +0 -81
  67. openstef/model_selection/__init__.py +0 -3
  68. openstef/model_selection/model_selection.py +0 -311
  69. openstef/monitoring/__init__.py +0 -3
  70. openstef/monitoring/performance_meter.py +0 -92
  71. openstef/monitoring/teams.py +0 -203
  72. openstef/pipeline/__init__.py +0 -3
  73. openstef/pipeline/create_basecase_forecast.py +0 -133
  74. openstef/pipeline/create_component_forecast.py +0 -168
  75. openstef/pipeline/create_forecast.py +0 -171
  76. openstef/pipeline/optimize_hyperparameters.py +0 -317
  77. openstef/pipeline/train_create_forecast_backtest.py +0 -163
  78. openstef/pipeline/train_model.py +0 -561
  79. openstef/pipeline/utils.py +0 -52
  80. openstef/postprocessing/__init__.py +0 -3
  81. openstef/postprocessing/postprocessing.py +0 -275
  82. openstef/preprocessing/__init__.py +0 -3
  83. openstef/preprocessing/preprocessing.py +0 -42
  84. openstef/settings.py +0 -15
  85. openstef/tasks/__init__.py +0 -3
  86. openstef/tasks/calculate_kpi.py +0 -324
  87. openstef/tasks/create_basecase_forecast.py +0 -118
  88. openstef/tasks/create_components_forecast.py +0 -162
  89. openstef/tasks/create_forecast.py +0 -145
  90. openstef/tasks/create_solar_forecast.py +0 -420
  91. openstef/tasks/create_wind_forecast.py +0 -80
  92. openstef/tasks/optimize_hyperparameters.py +0 -135
  93. openstef/tasks/split_forecast.py +0 -273
  94. openstef/tasks/train_model.py +0 -224
  95. openstef/tasks/utils/__init__.py +0 -3
  96. openstef/tasks/utils/dependencies.py +0 -107
  97. openstef/tasks/utils/predictionjobloop.py +0 -243
  98. openstef/tasks/utils/taskcontext.py +0 -160
  99. openstef/validation/__init__.py +0 -3
  100. openstef/validation/validation.py +0 -322
  101. openstef-3.4.56.dist-info/METADATA +0 -154
  102. openstef-3.4.56.dist-info/RECORD +0 -102
  103. openstef-3.4.56.dist-info/top_level.txt +0 -1
  104. /openstef-3.4.56.dist-info/LICENSE → /openstef-4.0.0a3.dist-info/licenses/LICENSE.md +0 -0
openstef/feature_engineering/weather_features.py
@@ -1,492 +0,0 @@
- # SPDX-FileCopyrightText: 2017-2023 Contributors to the OpenSTEF project <korte.termijn.prognoses@alliander.com> # noqa E501>
- #
- # SPDX-License-Identifier: MPL-2.0
-
- """This module contains all weather-related functions used for feature engineering."""
- import logging
- from typing import Union
-
- import numpy as np
- import pandas as pd
- import pvlib
- import structlog
- from pvlib.location import Location
-
- from openstef.data_classes.prediction_job import PredictionJobDataClass
- from openstef.settings import Settings
-
- structlog.configure(
-     wrapper_class=structlog.make_filtering_bound_logger(
-         logging.getLevelName(Settings.log_level)
-     )
- )
- logger = structlog.get_logger(__name__)
-
-
- # Set some (nameless) constants for the Antoine equation:
- A: float = 6.116
- M: float = 7.6
- TN: float = 240.7
- # Set some constants
- TORR: float = 133.322368  # 1 torr = 133 Pa
- # 1.168 is the mass of 1 m^3 of air on sea level with standard pressure.
- D: float = 1.168
-
- DEFAULT_LAT: float = 52.132633
- DEFAULT_LON: float = 5.291266
-
-
- def calc_saturation_pressure(
-     temperature: Union[float, np.ndarray]
- ) -> Union[float, np.ndarray]:
-     """Calculate the water vapour pressure from the temperature.
-
-     See https://www.vaisala.com/sites/default/files/documents/Humidity_Conversion_Formulas_B210973EN-F.pdf.
-
-     Args:
-         temperature: Temperature in C
-     Returns:
-         The saturation pressure of water at the respective temperature
-
-     """
-     psat = A * 10 ** ((M * temperature) / (temperature + TN))
-     return psat
-
-
- def calc_vapour_pressure(
-     rh: Union[float, np.ndarray], psat: Union[float, np.ndarray]
- ) -> Union[float, np.ndarray]:
-     """Calculates the vapour pressure.
-
-     Args:
-         rh: Relative humidity
-         psat: Saturation pressure: see calc_saturation_pressure
-     Returns:
-         The water vapour pressure
-
-     """
-     return rh * psat
-
-
- def calc_dewpoint(
-     vapour_pressure: Union[float, np.ndarray]
- ) -> Union[float, np.ndarray]:
-     """Calculates the dewpoint, see https://en.wikipedia.org/wiki/Dew_point for more info.
-
-     Args:
-         vapour_pressure: The vapour pressure for which the dewpoint should be calculated
-     Returns:
-         Dewpoint
-
-     """
-     return TN / ((M / np.log10(vapour_pressure / A)) - 1)
-
-
- def calc_air_density(
-     temperature: Union[float, np.ndarray],
-     pressure: Union[float, np.ndarray],
-     rh: Union[float, np.ndarray],
- ) -> Union[float, np.ndarray]:
-     """Calculates the air density.
-
-     Args:
-         temperature: The temperature in C
-         pressure: the atmospheric pressure in Pa
-         rh: Relative humidity
-
-     Returns:
-         The air density (kg/m^3)
-
-     """
-     # Calculate saturation pressure
-     psat = calc_saturation_pressure(temperature)
-     # Calculate the current vapour pressure
-     vapour_pressure = calc_vapour_pressure(rh, psat)
-
-     # Set temperature to K
-     temperature_k = temperature + 273.15
-
-     # Calculate air density
-     air_density = (
-         D
-         * (273.15 / temperature_k)
-         * ((pressure - 0.3783 * vapour_pressure) / 760 / TORR)
-     )
-
-     return air_density
-
-
- def add_humidity_features(
-     data: pd.DataFrame, feature_names: list[str] = None
- ) -> pd.DataFrame:
-     """Adds humidity features to the input dataframe.
-
-     These features are calculated using functions defined in this module. A list of
-     requested features is used to determine whether to add the humidity features or not.
-
-     Args:
-         data: Input dataframe to which features have to be added
-         feature_names: list of requested features.
-
-     Returns:
-         Same as input dataframe with extra columns for the humidity features.
-
-     """
-     # If features is None add humidity features anyway
-     if feature_names is None:
-         humidity_features = True
-
-     # Otherwise check if they are among the requested features
-     else:
-         humidity_features = any(
-             x
-             in [
-                 "saturation_pressure",
-                 "vapour_pressure",
-                 "dewpoint",
-                 "air_density",
-             ]
-             for x in feature_names
-         )
-
-     # Check if any of the humidity features are requested and add them
-     if humidity_features:
-         # Try to add humidity calculations, ignore if required columns are missing
-         try:
-             humidity_df = humidity_calculations(data.temp, data.humidity, data.pressure)
-             data = data.join(humidity_df)
-         except AttributeError:
-             pass  # This happens when a required column for humidity_calculations
-             # is not present
-
-     return data
-
-
- def humidity_calculations(
-     temperature: Union[float, np.ndarray],
-     rh: Union[float, np.ndarray],
-     pressure: Union[float, np.ndarray],
- ) -> Union[dict, np.ndarray]:
-     """Function that calculates weather features based on humidity.
-
-     These features are:
-         - Saturation pressure
-         - Vapour pressure
-         - Dewpoint
-         - Air density
-
-     Args:
-         temperature: Temperature in C
-         rh: Relative humidity in %
-         pressure: The air pressure in hPa
-
-     Returns:
-         If the input is an np.ndarray; a pandas dataframe with the calculated moisture indices,
-         if the input is numeric; a dict with the calculated moisture indices
-
-     """
-     # First: a sanity check on the relative humidity and the air pressure
-     # We only check on the type of temperature, because they need to be the same anyway
-     is_series = isinstance(temperature, (np.ndarray, pd.Series))
-     is_scalar = isinstance(temperature, (float, int))
-
-     if is_scalar is False and is_series is False:
-         raise TypeError(
-             "The input should be a pandas series or np.ndarray, or float or int"
-         )
-
-     # Suppress copy warnings
-     with pd.option_context("mode.chained_assignment", None):
-         if is_series:
-             rh[rh > 1] = rh / 100  # This triggers copy warnings
-             pressure[pressure < 80000] = np.nan  # This triggers copy warnings
-         else:
-             if rh > 1:
-                 rh /= 100
-             if pressure < 80000:
-                 pressure = np.nan
-
-     # If the input is a dataframe or np.ndarrays: return a dataframe
-     if is_series:
-         humidity_df = pd.DataFrame(
-             columns=[
-                 "saturation_pressure",
-                 "vapour_pressure",
-                 "dewpoint",
-                 "air_density",
-             ]
-         )
-         humidity_df["saturation_pressure"] = calc_saturation_pressure(temperature)
-         humidity_df["vapour_pressure"] = calc_vapour_pressure(
-             rh, humidity_df.saturation_pressure
-         )
-         humidity_df["dewpoint"] = calc_dewpoint(humidity_df.vapour_pressure)
-         humidity_df["air_density"] = calc_air_density(temperature, pressure, rh)
-
-         return humidity_df
-
-     # Else: if the input is numeric: return a dict
-     psat = calc_saturation_pressure(temperature)
-     pw = calc_vapour_pressure(rh, psat)
-     td = calc_dewpoint(pw)
-     air_density = calc_air_density(temperature, pressure, rh)
-     return {
-         "saturation_pressure": psat,
-         "vapour_pressure": pw,
-         "dewpoint": td,
-         "air_density": air_density,
-     }
-
-
- def calculate_windspeed_at_hubheight(
-     windspeed: Union[float, pd.Series],
-     fromheight: float = 10.0,
-     hub_height: float = 100.0,
- ) -> pd.Series:
-     """Calculate windspeed at hubheight.
-
-     Calculates the windspeed at hub height by extrapolation from a given height to a given
-     hub height using the wind power law https://en.wikipedia.org/wiki/Wind_profile_power_law
-
-     Args:
-         windspeed: float OR pandas series of windspeed at height = fromheight
-         fromheight: height (m) of the windspeed data. Default is 10m
-         hub_height: height (m) of the turbine
-
-     Returns:
-         Windspeed at hubheight.
-
-     """
-     alpha = 0.143
-
-     if not isinstance(windspeed, (np.ndarray, float, int, pd.Series)):
-         raise TypeError(
-             "The windspeed is not of the expected type!\n Got"
-             " {}, expected np.ndarray, pd series or numeric".format(type(windspeed))
-         )
-
-     try:
-         if any(windspeed < 0):
-             raise ValueError(
-                 "The windspeed cannot be negative, as it is the length of a vector"
-             )
-     except TypeError:
-         if windspeed < 0:
-             raise ValueError(
-                 "The windspeed cannot be negative, as it is the length of a vector"
-             )
-         windspeed = abs(windspeed)
-
-     return windspeed * (hub_height / fromheight) ** alpha
-
-
- def calculate_windturbine_power_output(
-     windspeed: pd.Series, n_turbines: int = 1, turbine_data: dict = None
- ) -> pd.Series:
-     """Calculate wind turbine power output.
-
-     These values are related through the power curve, which is described by turbine_data.
-     If no turbine_data is given, default values are used and results are normalized to 1MWp.
-     If n_turbines=1, the result is normalized to a rated power of 1.
-
-     Args:
-         windspeed: pd.DataFrame(index = datetime, columns = ["windspeedHub"])
-         n_turbines: The number of turbines
-         turbine_data: slope_center, rated_power, steepness
-
-     Returns:
-         pd.DataFrame(index = datetime, columns = ["forecast"])
-
-     """
-     if turbine_data is None:
-         turbine_data = {
-             "name": "Lagerwey L100",  # not used here
-             "cut_in": 3,  # not used here
-             "cut_off": 25,  # not used here
-             "kind": "onshore",  # not used here
-             "manufacturer": "Lagerwey",  # not used here
-             "peak_capacity": 1,  # not used here
-             "rated_power": 1,
-             "slope_center": 8.07,
-             "steepness": 0.664,
-         }
-     else:
-         required_properties = ["rated_power", "steepness", "slope_center"]
-         for prop in required_properties:
-             if prop not in turbine_data.keys():
-                 raise KeyError(f"Required property '{prop}' not set in turbine data")
-
-     generated_power = turbine_data["rated_power"] / (
-         1
-         + np.exp(
-             -turbine_data["steepness"] * (windspeed - turbine_data["slope_center"])
-         )
-     )
-     generated_power *= n_turbines
-
-     return generated_power
-
-
- def add_additional_wind_features(
-     data: pd.DataFrame, feature_names: list[str] = None
- ) -> pd.DataFrame:
-     """Adds additional wind features to the input data.
-
-     Args:
-         data: Dataframe to which the wind features have to be added
-         feature_names: List of requested features
-
-     Returns:
-         DataFrame same as input dataframe with extra columns for the added wind features
-
-     """
-     if feature_names is None:
-         additional_wind_features = True
-     else:
-         additional_wind_features = any(
-             x
-             in [
-                 "windspeed_100mExtrapolated",
-                 "windPowerFit_extrapolated",
-                 "windpowerFit_harm_arome",
-             ]
-             for x in feature_names
-         )
-
-     # Add additional wind features
-     if "windspeed" in data.columns and additional_wind_features:
-         data["windspeed_100mExtrapolated"] = calculate_windspeed_at_hubheight(
-             data["windspeed"]
-         )
-
-         data["windPowerFit_extrapolated"] = calculate_windturbine_power_output(
-             data["windspeed_100mExtrapolated"]
-         )
-
-     # Do extra check
-     if "windspeed_100m" in data.columns and additional_wind_features:
-         data["windpowerFit_harm_arome"] = calculate_windturbine_power_output(
-             data["windspeed_100m"].astype(float)
-         )
-
-     return data
-
-
- def calculate_dni(radiation: pd.Series, pj: PredictionJobDataClass) -> pd.Series:
-     """Calculate the direct normal irradiance (DNI).
-
-     This function uses the predicted radiation and information derived from the location (obtained from pj).
-
-
-     Args:
-         radiation: predicted radiation including DatetimeIndex with right time-zone
-         pj: PredictionJob including information about the location (lat, lon)
-
-     Returns:
-         Direct normal irradiance (DNI).
-
-     """
-     loc = Location(pj.get("lat", DEFAULT_LAT), pj.get("lon", DEFAULT_LON), tz="utc")
-     times = radiation.index
-
-     # calculate data for loc(ation) at times with clear_sky, as if there would be a clear sky.
-     cs = loc.get_clearsky(times)
-
-     # get solar position variable(s) for loc(ation) at times
-     solpos = pvlib.solarposition.get_solarposition(times, loc.latitude, loc.longitude)
-     solar_zenith = solpos.apparent_zenith
-
-     # convert radiation (ghi) to right unit (J/m^2 to kWh/m^2)
-     # TODO: check whether unit conversion is necessary
-     ghi_forecasted = radiation / 3600
-     # convert ghi to dni
-     dni_converted = pvlib.irradiance.dni(
-         ghi_forecasted, cs.dhi, solar_zenith, clearsky_dni=cs.dni
-     )
-     dni_converted = dni_converted.fillna(0)
-     return dni_converted
-
-
- def calculate_gti(
-     radiation: pd.Series,
-     pj: PredictionJobDataClass,
-     surface_tilt: float = 34.0,
-     surface_azimuth: float = 180,
- ) -> pd.Series:
-     """Calculate the GTI/POA using the radiation.
-
-     This function assumes Global Tilted Irradiance (GTI) = Plane of Array (POA)
-
-     Args:
-         radiation: pandas series with DatetimeIndex with right timezone information
-         pj: prediction job which should at least contain the latitude and longitude location.
-         surface_tilt: The tilt of the surface of, for example, your PhotoVoltaic-system.
-         surface_azimuth: The way the surface is facing. South facing 180 degrees, North facing 0 degrees, East facing 90 degrees and West facing 270 degrees
-
-     Returns:
-         Global Tilted Irradiance (GTI)
-
-     """
-     loc = Location(pj.get("lat", DEFAULT_LAT), pj.get("lon", DEFAULT_LON), tz="utc")
-     times = radiation.index
-
-     # calculate data for loc(ation) at times with clear_sky, as if there would be a clear sky.
-     cs = loc.get_clearsky(times)
-     dni = calculate_dni(radiation, pj)
-
-     # get solar position variable(s) for loc(ation) at times
-     solpos = pvlib.solarposition.get_solarposition(times, loc.latitude, loc.longitude)
-     solar_zenith = solpos.apparent_zenith
-     solar_azimuth = solpos.azimuth
-
-     ghi_forecasted = radiation / 3600
-     gti = pvlib.irradiance.get_total_irradiance(
-         surface_tilt,
-         surface_azimuth,
-         solar_zenith,
-         solar_azimuth,
-         dni=dni,
-         ghi=ghi_forecasted,
-         dhi=cs.dhi,
-     )
-
-     return gti["poa_global"]
-
-
- def add_additional_solar_features(
-     data: pd.DataFrame,
-     pj: PredictionJobDataClass = None,
-     feature_names: list[str] = None,
- ) -> pd.DataFrame:
-     """Adds additional solar features to the input data.
-
-     Args:
-         data: Dataframe to which the solar features have to be added
-         pj: prediction job which should at least contain the latitude and longitude location.
-         feature_names: List of requested features
-
-     Returns:
-         DataFrame same as input dataframe with extra columns for the added solar features
-
-     """
-     # If pj is None add solar features with Utrecht as default location
-     if pj is None:
-         logger.info(
-             "No prediction job, default location will be used for additional radiation features."
-         )
-         pj = {"lat": DEFAULT_LAT, "lon": DEFAULT_LON}
-
-     # If features is None add solar features anyway
-     if feature_names is None:
-         additional_solar_features = True
-
-     # Otherwise check if they are among the requested features
-     else:
-         additional_solar_features = any(x in ["dni", "gti"] for x in feature_names)
-
-     # Add additional solar features
-     if "radiation" in data.columns and additional_solar_features:
-         data["dni"] = calculate_dni(data["radiation"], pj)
-         data["gti"] = calculate_gti(data["radiation"], pj)
-
-     return data
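
Downstream code that imported helpers such as add_humidity_features, calculate_windspeed_at_hubheight or calculate_dni from openstef.feature_engineering.weather_features will no longer find them in 4.0.0a3, since the module is removed from the wheel. For reference, the humidity and wind relations above are standard (Antoine equation, wind profile power law, logistic power curve); the sketch below restates them outside openstef, using only the constants and formulas visible in the removed code. The column names match the removed features, but the function names and input values are illustrative, not an openstef API.

    import numpy as np
    import pandas as pd

    # Constants as defined in the removed module: Antoine-equation parameters,
    # 1 torr in Pa, and the density of air at sea level (kg/m^3).
    A, M, TN = 6.116, 7.6, 240.7
    TORR, D = 133.322368, 1.168

    def air_density(temp_c, pressure_pa, rh):
        """Air density (kg/m^3) from temperature (C), pressure (Pa) and relative humidity (0-1)."""
        psat = A * 10 ** ((M * temp_c) / (temp_c + TN))  # saturation pressure
        vapour_pressure = rh * psat
        temp_k = temp_c + 273.15
        return D * (273.15 / temp_k) * ((pressure_pa - 0.3783 * vapour_pressure) / 760 / TORR)

    def windspeed_at_hubheight(windspeed, from_height=10.0, hub_height=100.0, alpha=0.143):
        """Extrapolate windspeed to hub height with the wind profile power law."""
        return windspeed * (hub_height / from_height) ** alpha

    def turbine_power(windspeed_hub, rated_power=1.0, slope_center=8.07, steepness=0.664):
        """Logistic power curve used for the normalized windPowerFit features."""
        return rated_power / (1 + np.exp(-steepness * (windspeed_hub - slope_center)))

    # Illustrative hourly input; values are made up.
    weather = pd.DataFrame(
        {
            "temp": [12.0, 14.5],
            "pressure": [101300.0, 101250.0],
            "humidity": [0.8, 0.7],
            "windspeed": [6.5, 8.0],
        }
    )
    weather["air_density"] = air_density(weather["temp"], weather["pressure"], weather["humidity"])
    weather["windspeed_100mExtrapolated"] = windspeed_at_hubheight(weather["windspeed"])
    weather["windPowerFit_extrapolated"] = turbine_power(weather["windspeed_100mExtrapolated"])
    print(weather)

The solar features (dni, gti) additionally depend on pvlib's clear-sky and solar-position models and on the prediction job's latitude and longitude, so they are not restated here.
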
@@ -1,3 +0,0 @@
- # SPDX-FileCopyrightText: 2017-2023 Contributors to the OpenSTEF project <korte.termijn.prognoses@alliander.com> # noqa E501>
- #
- # SPDX-License-Identifier: MPL-2.0