BackboneTools 2025.0.0a0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,10 @@
1
+ *.py[cod]
2
+ *.pyo
3
+ *.pyd
4
+ *.egg-info/
5
+ dist/
6
+ build/
7
+ *.egg
8
+ *.whl
9
+ __pycache__/
10
+ *.gdx
@@ -0,0 +1,16 @@
1
+ Metadata-Version: 2.4
2
+ Name: BackboneTools
3
+ Version: 2025.0.0a0
4
+ Summary: BackboneTools is a Python package for working with Backbone.
5
+ Project-URL: Repository, https://gitlab.ruhr-uni-bochum.de/ee/backbonetools.git
6
+ Author-email: David Huckebrink <david.huckebrink@rub.de>, Leonie Plaga <leonie.plaga@rub.de>
7
+ Requires-Dist: gamsapi
8
+ Requires-Dist: matplotlib
9
+ Requires-Dist: numpy
10
+ Requires-Dist: openpyxl
11
+ Requires-Dist: pandas
12
+ Requires-Dist: plotly
13
+ Requires-Dist: tsam
14
+ Description-Content-Type: text/markdown
15
+
16
+ hello world
@@ -0,0 +1 @@
1
+ hello world
File without changes
@@ -0,0 +1,175 @@
1
+ """
2
+ backbonetools - create, modify and visualise input and output data for the esm backbone and run backbone
3
+ Copyright (C) 2020-2025 Leonie Plaga, David Huckebrink, Christine Nowak, Jan Mutke, Jonas Finke, Silke Johanndeiter, Sophie Pathe
4
+
5
+ This program is free software: you can redistribute it and/or modify
6
+ it under the terms of the GNU General Public License as published by
7
+ the Free Software Foundation, either version 3 of the License, or
8
+ (at your option) any later version.
9
+
10
+ This program is distributed in the hope that it will be useful,
11
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
12
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13
+ GNU General Public License for more details.
14
+
15
+ You should have received a copy of the GNU General Public License
16
+ along with this program. If not, see <http://www.gnu.org/licenses/>.
17
+ """
18
+
19
+ import os
20
+ import subprocess as sp
21
+ from glob import glob
22
+ from multiprocessing.pool import ThreadPool
23
+ from pathlib import Path
24
+
25
+ from backbonetools.io.input import BackboneInput
26
+ from backbonetools.io.output import BackboneResult
27
+
28
+
29
def run_backbone(
    input_dir,
    input_file_gdx,
    output_dir,
    output_file=None,
    backbone_dir=None,
    **kwargs,
):
    """Runs Backbone (via the `gams` CLI) with the specified arguments.

    Args:
        input_dir (str): Path to the input directory for Backbone to read configurations (e.g. `investInit.gms`)
        input_file_gdx (str): Path to the Backbone input file
        output_dir (str): Path to the output directory, where results shall be written
        output_file (str, optional): Name of the Backbone result file.
            Defaults to ``<input_file_gdx stem>_result.gdx``.
        backbone_dir (str, optional): Path to the Backbone Framework. Defaults to the
            path of the submodule in this repository.
        **kwargs: Forwarded to Backbone as ``--key=value`` command line options.

    Returns:
        Path: Absolute path of the produced Backbone result file.

    Raises:
        ValueError: If any of the involved paths contains a space (not
            supported when calling GAMS through a subprocess).
    """

    # if not specified, derive the result file name from input_file_gdx
    if not output_file:
        output_file = Path(input_file_gdx).stem + "_result.gdx"

    # if not specified, set backbone_dir to the submodule path next to this package
    if not backbone_dir:
        backbone_dir = Path(__file__).parent.parent.joinpath("backbone")

    # keyword arguments are parsed into backbone suitable form
    # e.g. dict(maxTotalCost=42) will be passed as "--maxTotalCost=42" to backbone
    keyword_args = [f"--{k}={v}" for k, v in kwargs.items()]

    # spaces in file names don't work through subprocesses
    contain_spaces = [
        " " in str(file_or_dir)
        for file_or_dir in [input_dir, input_file_gdx, output_dir, output_file]
    ]
    if any(contain_spaces):
        raise ValueError(
            "Passing paths with spaces via subprocess to Gams is not supported yet."
        )

    # absolute paths are better for gams
    input_dir = Path(input_dir).absolute().as_posix()
    input_file_gdx = Path(input_file_gdx).absolute().as_posix()
    output_dir = Path(output_dir).absolute().as_posix()

    # parents=True so freshly derived nested directories are created as well
    Path(input_dir).mkdir(parents=True, exist_ok=True)
    Path(output_dir).mkdir(parents=True, exist_ok=True)

    process_output = sp.run(
        [
            "gams",
            "Backbone.gms",
            f"--input_dir={input_dir}",
            f"--input_file_gdx={input_file_gdx}",
            f"--output_dir={output_dir}",
            f"--output_file={output_file}",
            *keyword_args,
        ],
        cwd=backbone_dir,
        stdout=sp.PIPE,
        stderr=sp.PIPE,
    )

    # write terminal output to log files; context managers close the handles
    # deterministically (the previous bare open(...).write(...) leaked them)
    log_stem = Path(output_file).stem
    with open(f"{output_dir}/{log_stem}_terminal.log", "w") as log_file:
        log_file.write(process_output.stdout.decode())
    with open(f"{output_dir}/{log_stem}_error.log", "w") as log_file:
        log_file.write(process_output.stderr.decode())

    print("finished", output_file)
    return Path(output_dir).joinpath(output_file).absolute()
103
+
104
+
105
def sensitivity(
    input_file_gdx,
    bb_input_dir,
    output_dir=None,
    parallel=True,
    param="CO2",
    percentages=(0.05, 0.1, 0.2, 0.4, 0.8),
):
    """Runs a CO2-cap sensitivity analysis around a reference Backbone run.

    First runs a reference optimisation (100% of `param`), then re-runs
    Backbone with the emission cap scaled to each entry of `percentages`
    relative to the reference emissions.

    Args:
        input_file_gdx (str): Path to the Backbone input gdx file.
        bb_input_dir (str): Backbone configuration input directory.
        output_dir (str, optional): Result directory. Defaults to
            ``<param>_outputs`` next to the input file.
        parallel (bool): Run the scenario cases concurrently via a thread pool.
        param (str): Parameter to vary; only "CO2" is implemented.
        percentages (tuple[float, ...]): Fractions of the reference emissions
            to use as caps. (Immutable default on purpose — a list default
            would be shared across calls.)

    Returns:
        list[Path]: Absolute paths of the scenario result files.

    Raises:
        NotImplementedError: If `param` is anything other than "CO2".
    """
    if param != "CO2":
        # NOTE: the previous message interpolated the *unsupported* value into
        # "other than {param}", which read backwards; state the supported value.
        raise NotImplementedError(
            f"sensitivity is only implemented for param='CO2', but {param!r} was passed."
        )

    sensitivity_dir = Path(input_file_gdx).parent
    sensitivity_input_dir = f"{sensitivity_dir}/{param}_inputs"
    if not output_dir:
        sensitivity_output_dir = f"{sensitivity_dir}/{param}_outputs"
    else:
        sensitivity_output_dir = output_dir

    # create directories
    Path(sensitivity_input_dir).mkdir(exist_ok=True)
    Path(sensitivity_output_dir).mkdir(exist_ok=True)

    bb_in = BackboneInput(input_file_gdx)
    bb_opt_fn = bb_in._path.stem + f"_100{param}_result.gdx"

    # run first optimisation i.e. 100% of `param`
    bb_out_path = run_backbone(
        bb_input_dir,
        input_file_gdx=bb_in._path,
        output_dir=sensitivity_output_dir,
        output_file=bb_opt_fn,
    )

    bb_result = BackboneResult(bb_out_path)

    # emission caps for the scenario runs, relative to the reference emissions
    emission_lims = bb_result.r_emission()["Val"].values * percentages

    # write one scaled input gdx per percentage
    for percentage, em_lim in zip(percentages, emission_lims):
        new_db = bb_in.update_gams_parameter_in_db(
            "p_groupPolicyEmission",
            ["emission group", "emissionCap", "CO2"],
            value=em_lim,
        )
        out_fn = Path(bb_in._path).stem + f"_{percentage*100:02.0f}{param}"
        new_db.export(f"{sensitivity_input_dir}/{out_fn}.gdx")

    input_files = list(glob(f"{sensitivity_input_dir}/*.gdx"))
    result_paths = []

    if parallel:
        # leave one core free; guard against cpu_count() returning None
        # (possible per the os docs) or 1, which previously gave ThreadPool(0)
        threads = max(1, (os.cpu_count() or 2) - 1)
        with ThreadPool(threads) as pool:
            jobs = [
                pool.apply_async(
                    run_backbone, (bb_input_dir, file, sensitivity_output_dir)
                )
                for file in input_files
            ]
            result_paths = [job.get() for job in jobs]
    else:
        for file in input_files:
            path = run_backbone(bb_input_dir, file, sensitivity_output_dir)
            result_paths.append(path)

    return result_paths
@@ -0,0 +1,298 @@
1
+ """
2
+ backbonetools - create, modify and visualise input and output data for the esm backbone and run backbone
3
+ Copyright (C) 2020-2025 Leonie Plaga, David Huckebrink, Christine Nowak, Jan Mutke, Jonas Finke, Silke Johanndeiter, Sophie Pathe
4
+
5
+ This program is free software: you can redistribute it and/or modify
6
+ it under the terms of the GNU General Public License as published by
7
+ the Free Software Foundation, either version 3 of the License, or
8
+ (at your option) any later version.
9
+
10
+ This program is distributed in the hope that it will be useful,
11
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
12
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13
+ GNU General Public License for more details.
14
+
15
+ You should have received a copy of the GNU General Public License
16
+ along with this program. If not, see <http://www.gnu.org/licenses/>.
17
+ """
18
+
19
+ import subprocess as sp
20
+ import warnings
21
+ from functools import partial, reduce
22
+ from io import StringIO
23
+ from itertools import groupby
24
+ from pathlib import Path
25
+
26
+ import pandas as pd
27
+ import tsam.timeseriesaggregation as tsam
28
+ from gams import GamsDatabase, GamsException, GamsSetRecord, GamsWorkspace
29
+
30
+
31
class BackboneInput:
    """Read/write access to a Backbone input ``*.gdx`` file via the GAMS API.

    Wraps a GamsDatabase loaded from the gdx file and exposes every symbol
    as a callable attribute returning a DataFrame (see
    `set_symbols_as_attribs`).
    """

    def __init__(self, path):
        """Loads the gdx file at `path` into a GamsDatabase.

        Args:
            path (str | Path): Path to an existing Backbone input gdx file.

        Raises:
            FileNotFoundError: If `path` does not exist.
        """
        # this section is redundant with results.BackboneResult
        ws = GamsWorkspace(".")

        self._path = Path(path).absolute()

        if not self._path.exists():
            raise FileNotFoundError(self._path)

        self.gams_db = ws.add_database_from_gdx(self._path.as_posix())

        self.set_symbols_as_attribs()

    @property
    def input_symbols(self):
        """list[str]: Names of all symbols in the gdx file (cached on first access)."""
        if hasattr(self, "_symbols"):
            return self._symbols
        # get all symbols from the gams database;
        # iterating gams_db raises an exception past the last index
        symbols = []
        try:
            for p in self.gams_db:
                symbols.append(p.name)
        except GamsException as ge:
            # the expected "out of range" error just terminates the iteration
            if "out of range" in str(ge) and str(self.gams_db.number_symbols) in str(
                ge
            ):
                pass
            else:
                # bare re-raise keeps the original traceback
                raise
        self._symbols = symbols
        return symbols

    def set_symbols_as_attribs(self):
        """
        Sets all input symbols as methods. Allows for easy access like
        `bb_input.p_gnu_io()` or `bb_input.ts_influx()`"""
        for symbol in self.input_symbols:
            setattr(self, symbol, partial(self.param_as_df_gdxdump, symbol))

    def param_as_df_gdxdump(
        self, symbol, encoding="1252", convert_time=True
    ) -> pd.DataFrame:
        """Use the 'gdxdump' GAMS utility via subprocess to convert a parameter into a pd.DataFrame.
        This is sometimes beneficial, to circumvent decoding errors.

        Args:
            symbol (str): name of the gdx symbol to dump.
            encoding (str): codec used to decode gdxdump's csv output.
            convert_time (bool): if True, convert the time column ("t000123")
                to int and rename it to "t".

        Returns:
            pd.DataFrame: long-format data; empty if the symbol has no records.
        """
        gdxdump = sp.run(
            ["gdxdump", self._path, "format", "csv", "symb", symbol], stdout=sp.PIPE
        )
        csv_data = gdxdump.stdout.decode(encoding=encoding)
        header = csv_data.partition("\n")[0]

        # all columns are strings except the value column
        header = [x.strip('"') for x in header.split(",")]
        dtypes = [str if x != "Val" else float for x in header]
        dtypes = dict(zip(header, dtypes))
        df = pd.read_csv(StringIO(csv_data), dtype=dtypes, na_values="Eps")

        if df.empty:
            return df

        # converts the time column to int by omitting the first character
        try:
            if convert_time:
                if "t" in df.columns:
                    df["t"] = df["t"].apply(lambda t: int(t[1:]))
                else:
                    # for backbone inputs, the index is ["Dim1", "Dim2", ... , "Val"],
                    # but there might be a time column hiding among the Dims
                    first_row = df.loc[0]
                    is_time = first_row.apply(lambda x: str(x).startswith("t000"))

                    if any(is_time):
                        # any() is necessary, otherwise *.idxmax() simply returns the first element
                        time_col = is_time.idxmax()  # should be something like "Dim4"
                        df[time_col] = df[time_col].apply(lambda t: int(t[1:]))
                        df.rename({time_col: "t"}, axis=1, inplace=True)
        except Exception as e:
            # best-effort conversion: report the failure (incl. the exception,
            # which was previously swallowed) and return the raw frame
            print(f"Error during time conversion for {symbol=}, {df=}: {e!r}")

        return df

    def update_gams_parameter_in_db(
        self,
        param_name: str,
        indices: list,
        value: float = None,
        apply_percentage: float = None,
    ) -> GamsDatabase:
        """Sets or scales a single record of a GAMS symbol in the loaded database.

        Note that this always works on the same database instance, i.e. the
        modification is persistent for the lifetime of this object.

        Args:
            param_name: symbol name, e.g. "p_groupPolicyEmission".
            indices: full index tuple of the record,
                e.g. ["emission group", "emissionCap", "CO2"].
            value: new value (or, for set records, the set text such as "Y").
            apply_percentage: if given, the current value is multiplied by
                this factor instead of being replaced.

        Returns:
            GamsDatabase: the (mutated) database.

        Raises:
            ValueError: if neither `value` nor `apply_percentage` is passed.
        """
        # retrieve the parameter i.e. "p_groupPolicyEmission"
        parameter = self.gams_db.get_symbol(param_name)

        # retrieve the record from that parameter i.e. ["emission group", "emissionCap", "CO2"]
        try:
            record = parameter.find_record(indices)
        except GamsException as ge:
            if "Cannot find" in ge.value:
                # This is potentially dangerous since any index value can be added.
                # However, in the case of a bad index, GAMS should throw a DomainViolationError
                warnings.warn(
                    f"Warning: Caught 'GamsException: {ge.value}'.\n\tSetting {indices} to {value}"
                )
                record = parameter.add_record(indices)
            else:
                raise

        # BUGFIX: this previously tested `type(value) is not None`, which is
        # always true (a type object is never None), so the ValueError below
        # was unreachable and a missing value ended up in record.set_value(None).
        if not apply_percentage and value is not None:
            if isinstance(record, GamsSetRecord):
                # sets only have text i.e. "Y"
                record.set_text(value)
            else:
                record.set_value(value)
        elif apply_percentage:
            current_val = record.get_value()
            record.set_value(current_val * apply_percentage)
        else:
            raise ValueError("one of 'value' and 'apply_percentage' must be passed!")
        return self.gams_db

    def aggregate_timeseries(
        self, export_path, hours_per_period=24 * 7, n_periods=3, err_indicators=None
    ):
        """Aggregates the input time series into typical periods via tsam and
        exports the aggregated database (incl. sample definitions) to `export_path`.

        Args:
            export_path: target gdx path for the aggregated database; sample
                weights are additionally written to "<export_path>_sample_weights.csv".
            hours_per_period (int): length of one typical period in hours.
            n_periods (int): number of typical periods to cluster.
            err_indicators: "print" to print tsam accuracy indicators, or None.

        Raises:
            NotImplementedError: for unsupported `err_indicators` values.
        """
        if err_indicators not in ("print", None):
            raise NotImplementedError(
                f" Only one of ('print',None) is supported for `err_indicators`, but {err_indicators=} was passed."
            )

        ts_params = ["ts_influx", "ts_node", "ts_unit", "ts_cf"]

        ts_frames = []
        # retrieve and transform timeseries data (not exaustive)
        for p in ts_params:
            p_df = self.param_as_df_gdxdump(p)
            if p_df.empty:
                # nothing to aggregate for this symbol
                continue
            # index of the time column
            time_col = list(p_df.columns).index("t")

            # all the previous columns (time is usually the penultimate column)
            index_cols = list(p_df.columns[:time_col])

            # transform from long to wide dataformat
            p_df = p_df.pivot(index="t", columns=index_cols, values="Val")

            # join column names from different levels and prepend param_name
            # these will come in handy, when writing aggregated data to the *.gdx
            # col is tuple, thus must be converted to a list to be mutable
            p_df.columns = ["|".join([p] + list(col)) for col in p_df.columns]

            ts_frames.append(p_df)
        # merge ts_frames to a single dataframe
        ts_df = reduce(
            lambda left, right: pd.merge(
                left, right, left_index=True, right_index=True, how="outer"
            ),
            ts_frames,
        )

        # create and set a datetimeindex (assumes one full hourly year
        # of data — TODO confirm for inputs covering other horizons)
        dateindex = pd.date_range(start="2020-01-01 00:00", periods=8760, freq="h")
        ts_df.set_index(dateindex, inplace=True)
        ts_df.fillna(0, inplace=True)

        # create aggregation
        aggregation = tsam.TimeSeriesAggregation(
            ts_df,
            hoursPerPeriod=hours_per_period,
            noTypicalPeriods=n_periods,
            clusterMethod="adjacent_periods",
            representationMethod="distributionAndMinMaxRepresentation",
        )

        # calculate the typical periods
        typeriods = aggregation.createTypicalPeriods()

        if err_indicators == "print":
            print(aggregation.accuracyIndicators())

        # get the sequence and number of occurances of each cluster
        period_sequence = [
            (k, sum(1 for i in g)) for k, g in groupby(aggregation.clusterOrder)
        ]

        # concatenate the typical periods following the cluster sequence
        ts_input_data = pd.concat(
            [typeriods.loc[period_no, :] for period_no, _ in period_sequence]
        ).reset_index(drop=True)

        # write data to gdx
        for col_name in ts_input_data.columns:
            # recreate the indices from the column names
            bb_indices = col_name.split("|")

            for i, val in enumerate(ts_input_data[col_name].values):
                timestep = f"t{i + 1:06}"
                self.update_gams_parameter_in_db(
                    bb_indices[0], bb_indices[1:] + [timestep], val
                )

        # add samples to .gdx where nessesary
        samples_and_lengths = [
            {
                "name": f"s{i:03}",
                "length": hours_per_period,
                "weight": tup[1],
                "cluster_no": tup[0],
            }
            for i, tup in enumerate(period_sequence)
        ]
        sample_df = pd.DataFrame.from_records(samples_and_lengths, index="name")
        sample_names = sample_df.index.to_list()

        if "p_s_discountFactor" not in self.input_symbols:
            self.gams_db.add_parameter_dc("p_s_discountFactor", ["s"])
        for sample in sample_df.index:
            self.update_gams_parameter_in_db("p_s_discountFactor", [sample], value=1)
            # sGroup domain: ["sample", "group"]
            self.update_gams_parameter_in_db(
                "sGroup", [sample, "emission group"], value="Y"
            )
        assert "emission group" in self.group().values

        if len(self.group().values) > 2:
            print(
                f"Warning: samples have been added for group 'emission group' but more are present in the .gdx:{self.group().values}"
            )

        # bind samples in gnss_bound
        # get nodes that have a state
        p_gn = self.p_gn()
        nodes_w_state = p_gn.query("Dim3=='energyStoredPerUnitOfState'")[
            ["Dim1", "Dim2"]
        ]
        gnss_df = pd.concat([nodes_w_state] * len(sample_names))
        gnss_df.sort_values(by="Dim2", inplace=True)

        # chain the samples circularly: s000 -> s001 -> ... -> s000
        from_sample = []
        to_sample = []
        for i in range(len(gnss_df)):
            from_sample.append(sample_names[i % len(sample_names)])
            to_sample.append(sample_names[(i + 1) % len(sample_names)])

        gnss_df["from_sample"] = from_sample
        gnss_df["to_sample"] = to_sample

        # clear records in bounds, because they might be invalid post-aggregation
        gnss_bounds = self.gams_db.get_symbol("gnss_bound")
        gnss_bounds.clear()

        for gnss_indices in gnss_df.values:
            self.update_gams_parameter_in_db(
                "gnss_bound", list(gnss_indices), value="Y"
            )

        print("Dont forget to update your bb input configuration!!")
        for i, tup in enumerate(period_sequence):
            print(
                f"s{i:03} - cluster:{tup[0]} - weight:{tup[1]},\tlength: {hours_per_period}"
            )
        sample_df.to_csv(str(export_path) + "_sample_weights.csv")

        self.gams_db.export(export_path)