PyPI - direl-ts-tool-kit - Versions diffs - 0.5.0__tar.gz → 0.6.0__tar.gz - Mend

direl-ts-tool-kit 0.5.0.tar.gz → 0.6.0.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (16) hide show

{direl_ts_tool_kit-0.5.0 → direl_ts_tool_kit-0.6.0}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: direl-ts-tool-kit
-Version: 0.5.0
+Version: 0.6.0
 Summary: A toolbox for time series analysis and visualization.
 Home-page: https://gitlab.com/direl/direl_tool_kit
 Author: Diego Restrepo-Leal
@@ -89,6 +89,14 @@ This function automatically sets major and minor time-based locators
 on the x-axis based on the specified time unit, and formats the y-axis
 to use scientific notation.
+#### plot_interpolation_analysis
+`plot_interpolation_analysis(df_original, variable, units="", method="polynomial", order=2, imputation_se=None, time_unit="Year", rot=90)`
+Performs interpolation on missing data (NaNs) in a specified column and
+plots the result, highlighting the imputed points with confidence intervals
+if the Imputation Standard Error (SE) is provided.
 #### save_figure
 `save_figure(fig, file_name, variable_name="", path="./")`

{direl_ts_tool_kit-0.5.0 → direl_ts_tool_kit-0.6.0}/README.md RENAMED Viewed

@@ -56,6 +56,14 @@ This function automatically sets major and minor time-based locators
 on the x-axis based on the specified time unit, and formats the y-axis
 to use scientific notation.
+#### plot_interpolation_analysis
+`plot_interpolation_analysis(df_original, variable, units="", method="polynomial", order=2, imputation_se=None, time_unit="Year", rot=90)`
+Performs interpolation on missing data (NaNs) in a specified column and
+plots the result, highlighting the imputed points with confidence intervals
+if the Imputation Standard Error (SE) is provided.
 #### save_figure
 `save_figure(fig, file_name, variable_name="", path="./")`

{direl_ts_tool_kit-0.5.0 → direl_ts_tool_kit-0.6.0}/direl_ts_tool_kit/plot/plot_style.py RENAMED Viewed

@@ -1,6 +1,8 @@
 import seaborn as sns
 import matplotlib.pyplot as plt
 import matplotlib.dates as mdates
+from matplotlib.lines import Line2D
 plt.style.use("fast")

{direl_ts_tool_kit-0.5.0 → direl_ts_tool_kit-0.6.0}/direl_ts_tool_kit/plot/plot_ts.py RENAMED Viewed

@@ -1,3 +1,4 @@
+import numpy as np
 import pandas as pd
 from .plot_style import *
 from scipy.stats import pearsonr
@@ -121,6 +122,159 @@ def plot_time_series(
     return fig
+def plot_interpolation_analysis(
+    df_original,
+    variable,
+    units="",
+    method="polynomial",
+    order=2,
+    imputation_se=None,
+    time_unit="Year",
+    rot=90,
+):
+    """
+    Interpolate the missing values (NaNs) of one column and plot the result.
+    Every point of the interpolated series is drawn; points that were NaN in
+    the input are colored differently from the observed ones. When an
+    Imputation Standard Error (SE) is given, 80% and 95% bands are shaded
+    around the imputed points and listed in the legend.
+    Parameters
+    ----------
+    df_original : pd.DataFrame
+        The DataFrame containing the original time series data. It is copied,
+        not modified.
+    variable : str
+        The name of the column to interpolate and plot (e.g., 'LPUE').
+    units : str, optional
+        Units to display next to the variable name on the y-axis. Defaults to "".
+    method : str, optional
+        The interpolation method (e.g., 'linear', 'polynomial', 'spline'),
+        forwarded to ``Series.interpolate``. Defaults to 'polynomial'.
+    order : int, optional
+        The order of the interpolation (required for 'polynomial' or 'spline'),
+        forwarded to ``Series.interpolate``. Defaults to 2.
+    imputation_se : pd.Series, float, or None, optional
+        The Standard Error (SE) of the imputation. This must be a single value
+        or a Series aligned with the DataFrame's index. If None, confidence
+        intervals will NOT be plotted. Defaults to None.
+    time_unit : str, optional
+        The time granularity for x-axis tick locators: "Year", "Month",
+        "Weekday", "Day" or "Hour". Any other value leaves Matplotlib's
+        default locators in place. Also used as the x-axis label.
+        Defaults to "Year".
+    rot : int, optional
+        Rotation angle (in degrees) for the x-axis tick labels. Defaults to 90.
+    Returns
+    -------
+    matplotlib.figure.Figure
+        The generated Matplotlib figure object with the plot.
+    """
+    # Remember which rows were missing before they are filled in.
+    imputed_mask = df_original[variable].isnull()
+    df_interpolated = df_original.copy()
+    df_interpolated[variable] = df_interpolated[variable].interpolate(
+        method=method, order=order
+    )
+    color1 = paper_colors["RED_LINES"]
+    color2 = paper_colors["GREEN_LINES"]
+    # One color per point: imputed -> color1, observed -> color2.
+    col = np.where(imputed_mask, color1, color2)
+    fig, ax = plt.subplots()
+    # Band artists are kept so they can be added to the legend below; the
+    # legend is built from explicit handles, so their labels alone would
+    # never be displayed.
+    band_handles = []
+    if imputation_se is not None:
+        # Keep values only at imputed positions so bands are not drawn
+        # around observed data.
+        df_imputed_only = df_interpolated.copy()
+        df_imputed_only.loc[~imputed_mask, variable] = np.nan
+        # Two-sided standard-normal multipliers for 80% and 95% coverage.
+        Z_80 = 1.282
+        Z_95 = 1.96
+        error_80 = Z_80 * imputation_se
+        error_95 = Z_95 * imputation_se
+        # NOTE(review): an imputed point whose neighbors are both observed
+        # sits between NaNs here, so its band presumably has zero width and
+        # is invisible - confirm and consider error bars for isolated points.
+        band_95 = ax.fill_between(
+            df_imputed_only.index,
+            df_imputed_only[variable] - error_95,
+            df_imputed_only[variable] + error_95,
+            color=paper_colors["GRAY_BARS"],
+            alpha=0.2,
+            edgecolor="none",
+            label="95% confidence interval",
+        )
+        band_80 = ax.fill_between(
+            df_imputed_only.index,
+            df_imputed_only[variable] - error_80,
+            df_imputed_only[variable] + error_80,
+            color=paper_colors["GRAY_BARS"],
+            alpha=0.4,
+            edgecolor="none",
+            label="80% confidence interval",
+        )
+        band_handles = [band_95, band_80]
+    ax.plot(
+        df_interpolated[variable],
+        linestyle="-.",
+        linewidth=1,
+        color=paper_colors["BLUE_LINES"],
+    )
+    ax.scatter(
+        df_interpolated.index,
+        df_interpolated[variable],
+        color=col,
+        s=10,
+        linewidth=4,
+    )
+    ax.set(xlabel=f"{time_unit}", ylabel=f"{variable} {units}")
+    ax.ticklabel_format(style="sci", axis="y", scilimits=(0, 0))
+    # (major, minor) locator classes for each supported granularity.
+    locators = {
+        "Year": (mdates.YearLocator, mdates.MonthLocator),
+        "Month": (mdates.MonthLocator, mdates.WeekdayLocator),
+        "Weekday": (mdates.WeekdayLocator, mdates.DayLocator),
+        "Day": (mdates.DayLocator, mdates.HourLocator),
+        "Hour": (mdates.HourLocator, mdates.MinuteLocator),
+    }
+    if time_unit in locators:
+        major_locator, minor_locator = locators[time_unit]
+        ax.xaxis.set_major_locator(major_locator())
+        ax.xaxis.set_minor_locator(minor_locator())
+    ax.tick_params(axis="x", rotation=rot)
+    ax.grid(which="both")
+    ax.grid(which="minor", alpha=0.6, linestyle=":")
+    ax.grid(which="major", alpha=0.8, linestyle="--")
+    # Proxy markers are needed because the scatter is a single artist drawn
+    # with per-point colors.
+    legend_elements = [
+        Line2D(
+            [0],
+            [0],
+            marker="o",
+            color=color2,
+            label="Current data",
+            linestyle="none",
+        ),
+        Line2D(
+            [0],
+            [0],
+            marker="o",
+            color=color1,
+            label="Imputed data",
+            linestyle="none",
+        ),
+        *band_handles,
+    ]
+    ax.legend(handles=legend_elements, loc="upper right")
+    return fig
 def save_figure(
     fig,
     file_name,

{direl_ts_tool_kit-0.5.0 → direl_ts_tool_kit-0.6.0}/direl_ts_tool_kit.egg-info/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: direl-ts-tool-kit
-Version: 0.5.0
+Version: 0.6.0
 Summary: A toolbox for time series analysis and visualization.
 Home-page: https://gitlab.com/direl/direl_tool_kit
 Author: Diego Restrepo-Leal
@@ -89,6 +89,14 @@ This function automatically sets major and minor time-based locators
 on the x-axis based on the specified time unit, and formats the y-axis
 to use scientific notation.
+#### plot_interpolation_analysis
+`plot_interpolation_analysis(df_original, variable, units="", method="polynomial", order=2, imputation_se=None, time_unit="Year", rot=90)`
+Performs interpolation on missing data (NaNs) in a specified column and
+plots the result, highlighting the imputed points with confidence intervals
+if the Imputation Standard Error (SE) is provided.
 #### save_figure
 `save_figure(fig, file_name, variable_name="", path="./")`

{direl_ts_tool_kit-0.5.0 → direl_ts_tool_kit-0.6.0}/setup.py RENAMED Viewed

@@ -2,7 +2,7 @@ from setuptools import setup, find_packages
 setup(
     name="direl-ts-tool-kit",
-    version="0.5.0",
+    version="0.6.0",
     description="A toolbox for time series analysis and visualization.",
     long_description=open("README.md", encoding="utf-8").read(),
     long_description_content_type="text/markdown",