PyPI - mrio-toolbox - Versions diffs - 1.0.0__py3-none-any.whl → 1.1.2__py3-none-any.whl - Mend

mrio-toolbox 1.0.0__py3-none-any.whl → 1.1.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of mrio-toolbox might be problematic. Click here for more details.

Files changed (67) hide show

__init__.py +21 -0
{mrio_toolbox/_parts → _parts}/_Axe.py +95 -37
{mrio_toolbox/_parts → _parts}/_Part.py +346 -111
_parts/__init__.py +7 -0
{mrio_toolbox/_parts → _parts}/part_operations.py +24 -17
extractors/__init__.py +20 -0
extractors/downloaders.py +36 -0
extractors/emerging/__init__.py +3 -0
extractors/emerging/emerging_extractor.py +117 -0
extractors/eora/__init__.py +3 -0
extractors/eora/eora_extractor.py +132 -0
extractors/exiobase/__init__.py +3 -0
extractors/exiobase/exiobase_extractor.py +270 -0
extractors/extractors.py +81 -0
extractors/figaro/__init__.py +3 -0
extractors/figaro/figaro_downloader.py +280 -0
extractors/figaro/figaro_extractor.py +187 -0
extractors/gloria/__init__.py +3 -0
extractors/gloria/gloria_extractor.py +202 -0
extractors/gtap11/__init__.py +7 -0
extractors/gtap11/extraction/__init__.py +3 -0
extractors/gtap11/extraction/extractor.py +129 -0
extractors/gtap11/extraction/harpy_files/__init__.py +6 -0
extractors/gtap11/extraction/harpy_files/_header_sets.py +279 -0
extractors/gtap11/extraction/harpy_files/har_file.py +262 -0
extractors/gtap11/extraction/harpy_files/har_file_io.py +974 -0
extractors/gtap11/extraction/harpy_files/header_array.py +300 -0
extractors/gtap11/extraction/harpy_files/sl4.py +229 -0
extractors/gtap11/gtap_mrio/__init__.py +6 -0
extractors/gtap11/gtap_mrio/mrio_builder.py +158 -0
extractors/icio/__init__.py +3 -0
extractors/icio/icio_extractor.py +121 -0
extractors/wiod/__init__.py +3 -0
extractors/wiod/wiod_extractor.py +143 -0
mrio_toolbox/mrio.py → mrio.py +254 -94
{mrio_toolbox-1.0.0.dist-info → mrio_toolbox-1.1.2.dist-info}/METADATA +11 -7
mrio_toolbox-1.1.2.dist-info/RECORD +59 -0
{mrio_toolbox-1.0.0.dist-info → mrio_toolbox-1.1.2.dist-info}/WHEEL +1 -1
mrio_toolbox-1.1.2.dist-info/top_level.txt +6 -0
msm/__init__.py +6 -0
msm/multi_scale_mapping.py +863 -0
utils/__init__.py +3 -0
utils/converters/__init__.py +5 -0
{mrio_toolbox/utils → utils}/converters/pandas.py +5 -6
{mrio_toolbox/utils → utils}/converters/xarray.py +6 -15
utils/formatting/formatter.py +527 -0
utils/loaders/__init__.py +7 -0
{mrio_toolbox/utils → utils}/loaders/_loader.py +60 -4
{mrio_toolbox/utils → utils}/loaders/_loader_factory.py +22 -1
{mrio_toolbox/utils → utils}/loaders/_nc_loader.py +37 -1
{mrio_toolbox/utils → utils}/loaders/_pandas_loader.py +29 -3
{mrio_toolbox/utils → utils}/loaders/_parameter_loader.py +61 -16
{mrio_toolbox/utils → utils}/savers/__init__.py +3 -0
utils/savers/_path_checker.py +37 -0
{mrio_toolbox/utils → utils}/savers/_to_folder.py +6 -1
utils/savers/_to_nc.py +60 -0
mrio_toolbox/__init__.py +0 -5
mrio_toolbox/_parts/__init__.py +0 -3
mrio_toolbox/utils/converters/__init__.py +0 -2
mrio_toolbox/utils/loaders/__init__.py +0 -3
mrio_toolbox/utils/savers/_path_checker.py +0 -19
mrio_toolbox/utils/savers/_to_nc.py +0 -52
mrio_toolbox-1.0.0.dist-info/RECORD +0 -26
mrio_toolbox-1.0.0.dist-info/top_level.txt +0 -1
{mrio_toolbox-1.0.0.dist-info → mrio_toolbox-1.1.2.dist-info/licenses}/LICENSE +0 -0
{mrio_toolbox/utils → utils/formatting}/__init__.py +0 -0
{mrio_toolbox/utils → utils}/loaders/_np_loader.py +0 -0

extractors/icio/__init__.py ADDED Viewed

@@ -0,0 +1,3 @@
+"""
+This module contains the ICIO extractor.
+"""

extractors/icio/icio_extractor.py ADDED Viewed

@@ -0,0 +1,121 @@
+# -*- coding: utf-8 -*-
+"""
+Created on Wed May 11 16:15:09 2022
+Major modifications on 04.02.2025 by wirth
+Load and convert ICIO MRIO files.
+Please put the Readme excel file in the same folder as the data and adjust the filename in the code.
+Supports ICIO 2021 in csv format
+https://www.oecd.org/sti/ind/inter-country-input-output-tables.htm
+@author: beaufils and wirth
+"""
+import os
+import logging
+import pandas as pd
+from mrio_toolbox import MRIO, Part
+from mrio_toolbox.utils.savers._to_nc import save_to_nc
+log = logging.getLogger(__name__)  # module-level logger named after this module
+def extract_icio(year, source, destination, extended=False):
+    """
+    Extract and convert ICIO MRIO data to NetCDF format for use with mrio_toolbox.
+    This function loads ICIO tables and associated labels from raw OECD files,
+    processes them, and stores the result as a NetCDF file. It supports both
+    standard and extended ICIO formats (where China and Mexico are split).
+    Parameters
+    ----------
+    year : str
+        Year of the ICIO data to load (e.g., "2021").
+    source : path-like
+        Path to the folder containing the raw ICIO data and ReadMe Excel file.
+    extended : bool, optional
+        If True, loads the extended version of the ICIO tables (China and Mexico split).
+        If False (default), loads the standard version.
+    Notes
+    -----
+    - The ReadMe Excel file must be present in the same source folder as the xlsx data file.
+    - Output filenames are automatically generated based on the year and format.
+    """
+    #Check source path
+    if not os.path.exists(source):
+        log.error(f"{os.path.abspath(source)} does not exist.")
+        raise NotADirectoryError(f"{os.path.abspath(source)} does not exist.")
+    #Check destination path
+    if not os.path.exists(destination):
+        log.info(f"{os.path.abspath(
+            destination)} does not exist. Creating directory.")
+        os.makedirs(destination)
+    # Adapt the filenames based on the extended parameter
+    if extended:
+        readme_filename = os.path.join(source, "ReadMe_ICIO_extended.xlsx")
+        data_filename = os.path.join(source, f"{year}.csv")
+    else:
+        readme_filename = os.path.join(source,"ReadMe_ICIO_small.xlsx")
+        data_filename = os.path.join(source, f"{year}_SML.csv")
+    # Load the labels
+    countries = pd.read_excel(readme_filename, sheet_name='Area_Activities', header=2)['countries'].dropna().to_list()
+    # Filter out everything in parenthesis, such as the additional references (1) and (2) for Israel and Cyprus
+    # as well as (People's Republic of China) for China and (People's Democratic Republic) for Lao
+    countries = [country.split('(')[0].strip() for country in countries]
+    sectors = pd.read_excel(readme_filename, sheet_name='Area_Activities', header=2)['Industry'].dropna().to_list()
+    df = pd.read_excel(readme_filename, sheet_name='ColItems',header=3)
+    index = df[df["Sector code"] == "Final demand items"].index[0]
+    y_labs = df.iloc[index:,4].to_list()
+    va_labs = ["Taxes less subsidies on intermediate and final products", "Value added at basic prices"]
+    labels = {
+        "countries": countries,
+        "sectors": sectors,
+        "y_labs": y_labs,
+        "va_labs": va_labs
+    }
+    if extended:
+        countries_y = countries[:-4] # remove MX1, MX2, CN1, CN2
+        labels["countries_y"] = countries_y
+    # Extract the raw data
+    s,c = len(sectors),len(countries)
+    raw = pd.read_csv(data_filename, header=0,index_col=0).to_numpy()
+    tables = {}
+    tables["t"] = raw[:c*s,:c*s]
+    tables["y"] = raw[:c*s,c*s:-1] # last column is cumulative output
+    tables["va"] = raw[c*s:-1,:c*s]
+    tables["vay"] = raw[c*s:-1,c*s:-1]
+    # Build MRIO object
+    m = MRIO()
+    m.add_dimensions(labels)
+    m.parts["t"] = m.new_part(name="t", data= tables["t"],
+        dimensions = [["countries","sectors"],["countries", "sectors"]])
+    m.parts["va"] = m.new_part(name="va", data= tables["va"],
+        dimensions = ["va_labs",["countries", "sectors"]])
+    if extended:
+        m.parts["y"] = m.new_part(name="y", data= tables["y"],
+            dimensions = [["countries","sectors"],["countries_y", "y_labs"]])
+        m.parts["vay"] = m.new_part(name="vay", data= tables["vay"],
+            dimensions = ["va_labs",["countries_y", "y_labs"]])
+    else:
+         m.parts["y"] = m.new_part(name="y",data= tables["y"],
+            dimensions = [["countries","sectors"],["countries", "y_labs"]])
+         m.parts["vay"] = m.new_part(name="vay", data= tables["vay"],
+            dimensions = ["va_labs",["countries", "y_labs"]])
+    # Save the mrio object to a NetCDF file
+    if extended:
+        destination = os.path.join(destination, f"icio_year{year}_extended.nc")
+    else:
+        destination = os.path.join(destination, f"icio_year{year}.nc")
+    save_to_nc(m, destination, overwrite=False)

extractors/wiod/__init__.py ADDED Viewed

@@ -0,0 +1,3 @@
+"""
+This module contains the WIOD extractor.
+"""

extractors/wiod/wiod_extractor.py ADDED Viewed

@@ -0,0 +1,143 @@
+"""
+Extractor for WIOD 2016 files.
+This script extracts data from WIOD xlsb files and converts them to NetCDF files
+for further use with the MRIO toolbox.
+Supports WIOD 2016 in Excel format
+https://www.rug.nl/ggdc/valuechain/wiod/wiod-2016-release
+Created on 08.01, 2024
+@author: wirth, based on code of beaufils
+"""
+import os
+import logging
+import pandas as pd
+from mrio_toolbox import MRIO
+from mrio_toolbox.utils.savers._to_nc import save_to_nc
+log = logging.getLogger(__name__)  # module-level logger named after this module
+def extract_wiod(
+    year,
+    source):
+    """
+    Extract WIOD data.
+    Loads WIOD tables and labels and store them as NetCDF for further use with
+    the mrio_toolbox library.
+    Parameters
+    ----------
+    year : str
+        Data year to load.
+    parts : str
+        Data blocks to load:
+            basic : T, Y
+            all : T, Y, VA, QT, QY
+    source : path-like
+        Path to folder where raw data is stored
+    """
+    #Check source path
+    if not os.path.exists(source):
+        log.error(f"{os.path.abspath(source)} does not exist.")
+        raise NotADirectoryError(f"{os.path.abspath(source)} does not exist.")
+    # WIOD 2016 comes with:
+    # - 43 countries + ROW
+    # - 56 sectors
+    # - 5 final demand categories
+    # - 6 value added category, including 5 tax categories
+    c,s,y,va = 44,56,5,6
+    log.info("Start loading")
+    tables = {}
+    raw = load_raw_WIOD(source, year)
+    countries, sectors, y_labs,  va_labs, = [],[],[],[]
+    labels = raw.columns
+    for i in range(c):
+        countries.append(labels[i*s][2].strip())
+    for i in range(s):
+        sectors.append(labels[i][1].strip())
+    for i in range(y):
+        y_labs.append(labels[s*c + i][1].strip())
+    for i in range(va):
+        va_labs.append(raw.index[s*c + 1 + i][1].strip())
+    raw = raw.to_numpy()
+    parts = ["t","y","va","vay"]
+    for part in parts:
+        if part == "t":
+            tables[part] = raw[:c*s,:c*s]
+        elif part == "y":
+            tables[part] = raw[:c*s,c*s:-1]
+        elif part == "va":
+            tables[part] = raw[c*s+1:-1,:c*s]
+        elif part == "vay":
+            tables[part] = raw[c*s+1:-1,c*s:-1]
+    # build an MRIO object from labels and tables
+    m = MRIO()
+    labels = {
+        "countries" : countries,
+        "sectors" : sectors,
+        "y_labs" : y_labs,
+        "va_labs" : va_labs, # including 5 tax categories
+        }
+    m.add_dimensions(labels)
+    m.parts["t"] = m.new_part(name="t",
+        data= tables["t"],
+        dimensions = [["countries","sectors"],["countries", "sectors"]])
+    m.parts["y"] = m.new_part(name="y",
+        data= tables["y"],
+        dimensions = [["countries","sectors"],["countries", "y_labs"]])
+    m.parts["va"] = m.new_part(name="va",
+        data= tables["va"],
+        dimensions = ["va_labs",["countries", "sectors"]])
+    m.parts["vay"] = m.new_part(name="vay",
+        data= tables["vay"],
+        dimensions = ["va_labs",["countries", "y_labs"]])
+    m.name = f"wiod16_{year}"
+    return m
+def load_raw_WIOD(path, year,release=16):
+    """
+    Load the raw WIOD matrix
+    Parameters
+    ----------
+    year : int-like
+    release : int-like, optional
+        Version of the WIOD database. The default is 2016.
+    Returns
+    -------
+    Pandas DataFrame
+        Full WIOD table as pandas DataFrame.
+    """
+    #Check source path
+    path = os.path.join(path, f'WIOT{year}_Nov{release}_ROW.xlsb')
+    if not os.path.exists(path):
+        log.error(f"{os.path.abspath(path)} does not exist.")
+        raise NotADirectoryError(f"{os.path.abspath(path)} does not exist.")
+    return pd.read_excel(path, header=[2,3,4,5],index_col=[0,1,2,3])
+if __name__ == "__main__":
+    extract_wiod(year=2014,
+                release=16,
+                source='/home/florian/job_merkator_institut/MRIO Projects/MRIOs/WIOD 2016 release',
+                destination="/home/florian/job_merkator_institut/MRIO Projects/MRIOs/netCDF objects")

mrio-toolbox 1.0.0__py3-none-any.whl → 1.1.2__py3-none-any.whl

Potentially problematic release.

mrio-toolbox 1.0.0__py3-none-any.whl → 1.1.2__py3-none-any.whl