tscli-darts 0.1.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- tscli/__init__.py +5 -0
- tscli/__main__.py +5 -0
- tscli/analysis.py +63 -0
- tscli/data.py +64 -0
- tscli/forecasting.py +531 -0
- tscli/main.py +422 -0
- tscli/preprocessing.py +113 -0
- tscli_darts-0.1.0.dist-info/METADATA +204 -0
- tscli_darts-0.1.0.dist-info/RECORD +12 -0
- tscli_darts-0.1.0.dist-info/WHEEL +5 -0
- tscli_darts-0.1.0.dist-info/entry_points.txt +2 -0
- tscli_darts-0.1.0.dist-info/top_level.txt +1 -0
tscli/__init__.py
ADDED
tscli/__main__.py
ADDED
tscli/analysis.py
ADDED
|
@@ -0,0 +1,63 @@
|
|
|
1
|
+
from __future__ import annotations
|
|
2
|
+
|
|
3
|
+
from dataclasses import dataclass
|
|
4
|
+
|
|
5
|
+
import pandas as pd
|
|
6
|
+
|
|
7
|
+
from tscli.data import LoadedSeries
|
|
8
|
+
|
|
9
|
+
|
|
10
|
+
@dataclass
class SeriesSummary:
    """Descriptive statistics and metadata for a loaded time series."""

    row_count: int
    start: str
    end: str
    missing_target: int
    mean: float
    median: float
    minimum: float
    maximum: float
    std_dev: float
    inferred_frequency: str
    trend_direction: str


def summarize_series(dataset: LoadedSeries) -> SeriesSummary:
    """Build a SeriesSummary for *dataset*.

    Frequency inference is skipped for the synthetic "__index__" axis.
    Statistics are computed over non-missing target values only.

    Raises:
        ValueError: if the target column holds no non-missing values.
    """
    data = dataset.frame.copy()
    raw_target = data[dataset.target_col]

    freq_label = "not available"
    if dataset.time_col != "__index__":
        detected = pd.infer_freq(data[dataset.time_col])
        if detected:
            freq_label = detected

    observed = raw_target.dropna()
    if observed.empty:
        raise ValueError("The target series is empty after dropping missing values.")

    # Crude trend signal: compare last and first observed values.
    delta = observed.iloc[-1] - observed.iloc[0]
    if delta > 0:
        direction = "upward"
    elif delta < 0:
        direction = "downward"
    else:
        direction = "flat"

    return SeriesSummary(
        row_count=len(data),
        start=str(data[dataset.time_col].iloc[0]),
        end=str(data[dataset.time_col].iloc[-1]),
        missing_target=int(raw_target.isna().sum()),
        mean=float(observed.mean()),
        median=float(observed.median()),
        minimum=float(observed.min()),
        maximum=float(observed.max()),
        std_dev=float(observed.std(ddof=0)),
        inferred_frequency=freq_label,
        trend_direction=direction,
    )
|
|
60
|
+
|
|
61
|
+
|
|
62
|
+
def recent_observations(dataset: LoadedSeries, rows: int = 5) -> pd.DataFrame:
    """Return a copy of the last *rows* (time, target) rows of the dataset."""
    columns = [dataset.time_col, dataset.target_col]
    tail = dataset.frame[columns].tail(rows)
    return tail.copy()
|
tscli/data.py
ADDED
|
@@ -0,0 +1,64 @@
|
|
|
1
|
+
from __future__ import annotations
|
|
2
|
+
|
|
3
|
+
from dataclasses import dataclass
|
|
4
|
+
from pathlib import Path
|
|
5
|
+
|
|
6
|
+
import pandas as pd
|
|
7
|
+
|
|
8
|
+
from tscli.preprocessing import (
|
|
9
|
+
PreprocessingReport,
|
|
10
|
+
clean_numeric_column,
|
|
11
|
+
finalize_time_series,
|
|
12
|
+
normalize_columns,
|
|
13
|
+
parse_time_column,
|
|
14
|
+
)
|
|
15
|
+
|
|
16
|
+
|
|
17
|
+
@dataclass
class LoadedSeries:
    """A CSV time series after loading and cleanup, plus its provenance."""

    # Path of the CSV file the data came from.
    source: Path
    # Cleaned dataframe; always contains `time_col` and `target_col`.
    frame: pd.DataFrame
    # Name of the time column, or "__index__" when a synthetic integer
    # index was created because no time column was found.
    time_col: str
    # Name of the numeric column being summarized/forecast.
    target_col: str
    # Log of the cleanup fixes applied while loading.
    report: PreprocessingReport
|
|
24
|
+
|
|
25
|
+
|
|
26
|
+
def load_csv(csv_path: Path, time_col: str | None, target_col: str) -> LoadedSeries:
    """Read *csv_path*, clean it up, and return it as a LoadedSeries.

    When *time_col* is None, common time-column names are tried; if none
    match, a synthetic 0..n-1 integer index named "__index__" is created.

    Raises:
        ValueError: if the target column is missing or non-numeric, or the
            time column is missing or cannot be parsed as datetime.
    """
    report = PreprocessingReport()
    frame = normalize_columns(pd.read_csv(csv_path), report)

    if target_col not in frame.columns:
        raise ValueError(f"Target column '{target_col}' was not found in the CSV.")

    resolved_time_col = time_col
    if resolved_time_col is None:
        # Auto-detect: first match wins, in this priority order.
        candidates = ("date", "datetime", "timestamp", "ds", "time")
        resolved_time_col = next(
            (name for name in candidates if name in frame.columns), None
        )

    if resolved_time_col is None:
        # No usable time column at all: synthesize an integer axis.
        resolved_time_col = "__index__"
        frame[resolved_time_col] = pd.RangeIndex(start=0, stop=len(frame), step=1)
        report.add_fix("Created a synthetic integer time index because no time column was provided.")
    else:
        if resolved_time_col not in frame.columns:
            raise ValueError(f"Time column '{resolved_time_col}' was not found in the CSV.")
        frame = parse_time_column(frame, resolved_time_col, report)
        if frame[resolved_time_col].isna().any():
            raise ValueError(
                f"Time column '{resolved_time_col}' contains values that could not be parsed as datetime."
            )

    frame = clean_numeric_column(frame, target_col, report)
    if frame[target_col].isna().all():
        raise ValueError(f"Target column '{target_col}' does not contain numeric values.")
    frame = finalize_time_series(frame, resolved_time_col, target_col, report)

    return LoadedSeries(
        source=csv_path,
        frame=frame,
        time_col=resolved_time_col,
        target_col=target_col,
        report=report,
    )
|
tscli/forecasting.py
ADDED
|
@@ -0,0 +1,531 @@
|
|
|
1
|
+
from __future__ import annotations
|
|
2
|
+
|
|
3
|
+
from dataclasses import dataclass
|
|
4
|
+
from importlib import import_module
|
|
5
|
+
from pathlib import Path
|
|
6
|
+
from typing import Any
|
|
7
|
+
|
|
8
|
+
import matplotlib.pyplot as plt
|
|
9
|
+
import numpy as np
|
|
10
|
+
import pandas as pd
|
|
11
|
+
from darts import TimeSeries
|
|
12
|
+
from statsmodels.tsa.arima.model import ARIMA as StatsmodelsARIMA
|
|
13
|
+
from statsmodels.tsa.statespace.sarimax import SARIMAX
|
|
14
|
+
from tqdm import tqdm
|
|
15
|
+
|
|
16
|
+
from tscli.data import LoadedSeries
|
|
17
|
+
|
|
18
|
+
|
|
19
|
+
@dataclass(frozen=True)
class ModelSpec:
    """Immutable metadata describing one supported forecasting model."""

    # Human-readable one-line description of the model.
    description: str
    # Implementation family: "built-in" (numpy/pandas heuristics) or
    # "darts-classical" (wraps an optionally-installed DARTS model).
    family: str
|
|
23
|
+
|
|
24
|
+
|
|
25
|
+
# Registry of every model name the CLI accepts, mapped to its description and
# implementation family ("built-in" heuristics vs. DARTS-backed classical).
MODEL_SPECS = {
    "naive-last": ModelSpec("Repeats the last observed value.", "built-in"),
    "naive-drift": ModelSpec("Extends the line from the first to the last observation.", "built-in"),
    "naive-seasonal": ModelSpec("Repeats the last seasonal pattern.", "built-in"),
    "moving-average": ModelSpec("Forecasts with the mean of the latest seasonal window.", "built-in"),
    "weighted-moving-average": ModelSpec(
        "Forecasts with a linearly weighted average of the latest seasonal window.", "built-in"
    ),
    "exp-smoothing": ModelSpec("Forecasts with an exponentially weighted moving average level.", "built-in"),
    "seasonal-average": ModelSpec(
        "Forecasts each seasonal position with the average of past matching positions.", "built-in"
    ),
    "seasonal-median": ModelSpec(
        "Forecasts each seasonal position with the median of past matching positions.", "built-in"
    ),
    "linear-trend": ModelSpec("Fits a straight trend line across the series.", "built-in"),
    "quadratic-trend": ModelSpec("Fits a quadratic trend curve across the series.", "built-in"),
    "arima": ModelSpec("DARTS ARIMA model for classical forecasting.", "darts-classical"),
    "theta": ModelSpec("DARTS Theta model for classical univariate forecasting.", "darts-classical"),
    "exponential-smoothing": ModelSpec(
        "DARTS ExponentialSmoothing model for level, trend, and seasonality.", "darts-classical"
    ),
    "auto-arima": ModelSpec("DARTS AutoARIMA model with automatic order selection.", "darts-classical"),
    "sarima": ModelSpec("DARTS ARIMA model configured with seasonal ARIMA defaults.", "darts-classical"),
}

# name -> description view of the registry, used for model-name validation.
SUPPORTED_MODELS = {name: spec.description for name, spec in MODEL_SPECS.items()}
|
|
52
|
+
|
|
53
|
+
|
|
54
|
+
@dataclass
class ForecastResult:
    """A single model's forecast output."""

    # Name of the model that produced the forecast.
    model_name: str
    # Two-column frame (time, target) holding the future values.
    forecast_frame: pd.DataFrame
|
|
58
|
+
|
|
59
|
+
|
|
60
|
+
@dataclass
class EvaluationResult:
    """Accuracy scores for one model on a holdout window."""

    model_name: str
    # Mean absolute error.
    mae: float
    # Root mean squared error.
    rmse: float
    # Mean absolute percentage error (in percent); NaN when every actual
    # value is zero.
    mape: float
|
|
66
|
+
|
|
67
|
+
|
|
68
|
+
@dataclass
class BenchmarkResult:
    """Outcome of back-testing several models on the same holdout window."""

    # Per-model scores, sorted best-first (by RMSE, then MAE, then name).
    scores: list[EvaluationResult]
    # The holdout rows the forecasts were scored against.
    actual_frame: pd.DataFrame
    # model name -> its forecast frame, for models that succeeded.
    forecasts: dict[str, pd.DataFrame]
    # Name of the top-ranked model (first entry of `scores`).
    best_model: str
    # model name -> error message, for models that failed to run.
    skipped_models: dict[str, str]
|
|
75
|
+
|
|
76
|
+
|
|
77
|
+
def build_series(dataset: LoadedSeries) -> TimeSeries:
    """Convert the dataset's (time, target) columns into a DARTS TimeSeries."""
    pair = dataset.frame[[dataset.time_col, dataset.target_col]].dropna().copy()

    if dataset.time_col != "__index__":
        # Real timestamps: keep them as-is; do not invent missing dates.
        return TimeSeries.from_dataframe(
            pair,
            time_col=dataset.time_col,
            value_cols=dataset.target_col,
            fill_missing_dates=False,
        )

    # Synthetic axis: renumber 0..n-1 so the index is gap-free after dropna().
    pair[dataset.time_col] = pd.RangeIndex(start=0, stop=len(pair), step=1)
    return TimeSeries.from_dataframe(
        pair,
        time_col=dataset.time_col,
        value_cols=dataset.target_col,
    )
|
|
94
|
+
|
|
95
|
+
|
|
96
|
+
def _future_index(frame: pd.DataFrame, time_col: str, horizon: int) -> pd.Index:
|
|
97
|
+
if time_col == "__index__":
|
|
98
|
+
start = int(frame[time_col].iloc[-1]) + 1
|
|
99
|
+
return pd.RangeIndex(start=start, stop=start + horizon, step=1)
|
|
100
|
+
|
|
101
|
+
inferred = pd.infer_freq(frame[time_col])
|
|
102
|
+
if inferred:
|
|
103
|
+
offset = pd.tseries.frequencies.to_offset(inferred)
|
|
104
|
+
start = frame[time_col].iloc[-1] + offset
|
|
105
|
+
return pd.date_range(start=start, periods=horizon, freq=offset)
|
|
106
|
+
|
|
107
|
+
if len(frame) >= 2:
|
|
108
|
+
delta = frame[time_col].iloc[-1] - frame[time_col].iloc[-2]
|
|
109
|
+
else:
|
|
110
|
+
delta = pd.Timedelta(days=1)
|
|
111
|
+
start = frame[time_col].iloc[-1] + delta
|
|
112
|
+
return pd.Index([start + delta * step for step in range(horizon)])
|
|
113
|
+
|
|
114
|
+
|
|
115
|
+
def _coerce_output_frame(frame: pd.DataFrame, time_col: str) -> pd.DataFrame:
|
|
116
|
+
export = frame.copy()
|
|
117
|
+
if time_col != "__index__" and pd.api.types.is_datetime64_any_dtype(export[time_col]):
|
|
118
|
+
export[time_col] = export[time_col].dt.strftime("%Y-%m-%d")
|
|
119
|
+
return export
|
|
120
|
+
|
|
121
|
+
|
|
122
|
+
def _dataset_from_frame(dataset: LoadedSeries, frame: pd.DataFrame) -> LoadedSeries:
    """Clone *dataset* with *frame* (re-indexed from 0) as its data."""
    reindexed = frame.reset_index(drop=True)
    return LoadedSeries(
        source=dataset.source,
        frame=reindexed,
        time_col=dataset.time_col,
        target_col=dataset.target_col,
        report=dataset.report,
    )
|
|
130
|
+
|
|
131
|
+
|
|
132
|
+
def _load_optional_model(model_name: str) -> Any:
    """Import and return the DARTS model class backing *model_name*.

    The classical models are optional dependencies; when the import fails,
    a ValueError with an install hint is raised instead.
    """
    # model name -> (module path, class name) of the optional DARTS class.
    # Note "sarima" reuses the DARTS ARIMA class with seasonal kwargs.
    loaders = {
        "arima": ("darts.models.forecasting.arima", "ARIMA"),
        "theta": ("darts.models.forecasting.theta", "Theta"),
        "exponential-smoothing": ("darts.models.forecasting.exponential_smoothing", "ExponentialSmoothing"),
        "auto-arima": ("darts.models.forecasting.sf_auto_arima", "AutoARIMA"),
        "sarima": ("darts.models.forecasting.arima", "ARIMA"),
    }
    module_name, class_name = loaders[model_name]
    try:
        module = import_module(module_name)
        return getattr(module, class_name)
    except Exception as exc:  # pragma: no cover - environment dependent
        # Point the user at the packaging extra that provides the dependency.
        extra_hint = "Install tscli with the right optional extra."
        if model_name in {"arima", "theta", "exponential-smoothing", "sarima"}:
            extra_hint = "Install tscli with the 'classical' extra: pip install -e .[classical]"
        elif model_name == "auto-arima":
            extra_hint = (
                "Install tscli with the 'autoarima' extra, or 'full' for everything: "
                "pip install -e .[autoarima]"
            )
        raise ValueError(
            f"Model '{model_name}' is unavailable in this environment. {extra_hint}. "
            f"Original error: {exc}"
        ) from exc
|
|
157
|
+
|
|
158
|
+
|
|
159
|
+
def _heuristic_forecast_values(
|
|
160
|
+
history: np.ndarray,
|
|
161
|
+
model_name: str,
|
|
162
|
+
horizon: int,
|
|
163
|
+
seasonal_period: int,
|
|
164
|
+
) -> np.ndarray:
|
|
165
|
+
if len(history) == 0:
|
|
166
|
+
raise ValueError("The target series is empty after dropping missing values.")
|
|
167
|
+
|
|
168
|
+
if model_name == "naive-last":
|
|
169
|
+
return np.repeat(history[-1], horizon)
|
|
170
|
+
|
|
171
|
+
if model_name == "naive-drift":
|
|
172
|
+
if len(history) == 1:
|
|
173
|
+
return np.repeat(history[-1], horizon)
|
|
174
|
+
slope = (history[-1] - history[0]) / (len(history) - 1)
|
|
175
|
+
return np.array([history[-1] + slope * step for step in range(1, horizon + 1)])
|
|
176
|
+
|
|
177
|
+
if model_name == "naive-seasonal":
|
|
178
|
+
if len(history) < seasonal_period:
|
|
179
|
+
raise ValueError(
|
|
180
|
+
f"Naive seasonal needs at least {seasonal_period} observations, but found {len(history)}."
|
|
181
|
+
)
|
|
182
|
+
pattern = history[-seasonal_period:]
|
|
183
|
+
return np.array([pattern[step % seasonal_period] for step in range(horizon)])
|
|
184
|
+
|
|
185
|
+
if model_name == "moving-average":
|
|
186
|
+
window = min(seasonal_period, len(history))
|
|
187
|
+
average = float(np.mean(history[-window:]))
|
|
188
|
+
return np.repeat(average, horizon)
|
|
189
|
+
|
|
190
|
+
if model_name == "weighted-moving-average":
|
|
191
|
+
window = min(seasonal_period, len(history))
|
|
192
|
+
weights = np.arange(1, window + 1, dtype=float)
|
|
193
|
+
average = float(np.average(history[-window:], weights=weights))
|
|
194
|
+
return np.repeat(average, horizon)
|
|
195
|
+
|
|
196
|
+
if model_name == "exp-smoothing":
|
|
197
|
+
span = max(2, min(seasonal_period, len(history)))
|
|
198
|
+
level = float(pd.Series(history).ewm(span=span, adjust=False).mean().iloc[-1])
|
|
199
|
+
return np.repeat(level, horizon)
|
|
200
|
+
|
|
201
|
+
if model_name == "seasonal-average":
|
|
202
|
+
if len(history) < seasonal_period:
|
|
203
|
+
raise ValueError(
|
|
204
|
+
f"Seasonal average needs at least {seasonal_period} observations, but found {len(history)}."
|
|
205
|
+
)
|
|
206
|
+
values = []
|
|
207
|
+
for step in range(horizon):
|
|
208
|
+
position = step % seasonal_period
|
|
209
|
+
seasonal_slice = history[position::seasonal_period]
|
|
210
|
+
values.append(float(np.mean(seasonal_slice)))
|
|
211
|
+
return np.array(values)
|
|
212
|
+
|
|
213
|
+
if model_name == "seasonal-median":
|
|
214
|
+
if len(history) < seasonal_period:
|
|
215
|
+
raise ValueError(
|
|
216
|
+
f"Seasonal median needs at least {seasonal_period} observations, but found {len(history)}."
|
|
217
|
+
)
|
|
218
|
+
values = []
|
|
219
|
+
for step in range(horizon):
|
|
220
|
+
position = step % seasonal_period
|
|
221
|
+
seasonal_slice = history[position::seasonal_period]
|
|
222
|
+
values.append(float(np.median(seasonal_slice)))
|
|
223
|
+
return np.array(values)
|
|
224
|
+
|
|
225
|
+
if model_name == "quadratic-trend":
|
|
226
|
+
if len(history) < 3:
|
|
227
|
+
raise ValueError("Quadratic trend needs at least 3 observations.")
|
|
228
|
+
x = np.arange(len(history), dtype=float)
|
|
229
|
+
a, b, c = np.polyfit(x, history.astype(float), 2)
|
|
230
|
+
future_x = np.arange(len(history), len(history) + horizon, dtype=float)
|
|
231
|
+
return a * np.square(future_x) + b * future_x + c
|
|
232
|
+
|
|
233
|
+
x = np.arange(len(history), dtype=float)
|
|
234
|
+
slope, intercept = np.polyfit(x, history.astype(float), 1)
|
|
235
|
+
future_x = np.arange(len(history), len(history) + horizon, dtype=float)
|
|
236
|
+
return intercept + slope * future_x
|
|
237
|
+
|
|
238
|
+
|
|
239
|
+
def _darts_classical_forecast(
    dataset: LoadedSeries,
    model_name: str,
    horizon: int,
    seasonal_period: int,
) -> pd.DataFrame:
    """Fit the requested DARTS classical model and forecast *horizon* steps.

    Returns a two-column frame (time, target). Raises ValueError when the
    model cannot be loaded, fails to fit/predict, or its output cannot be
    converted to a table.
    """
    series = build_series(dataset)
    model_class = _load_optional_model(model_name)

    # Model-specific construction; seasonal settings are only passed when
    # the series covers at least two full seasonal cycles.
    if model_name == "theta":
        model = model_class()
    elif model_name == "exponential-smoothing":
        kwargs: dict[str, Any] = {}
        if len(series) >= seasonal_period * 2:
            kwargs["seasonal_periods"] = seasonal_period
        model = model_class(**kwargs)
    elif model_name == "auto-arima":
        kwargs = {}
        if len(series) >= seasonal_period * 2:
            kwargs["season_length"] = seasonal_period
        model = model_class(**kwargs)
    elif model_name == "sarima":
        kwargs = {"p": 1, "d": 1, "q": 1}
        if len(series) >= seasonal_period * 2:
            kwargs["seasonal_order"] = (1, 1, 1, seasonal_period)
        model = model_class(**kwargs)
    else:
        # Remaining case is "arima": plain non-seasonal ARIMA(1, 1, 1).
        model = model_class(p=1, d=1, q=1)

    try:
        model.fit(series)
        forecast = model.predict(horizon)
    except Exception as exc:  # pragma: no cover - environment dependent
        raise ValueError(f"Model '{model_name}' failed to fit or predict. Original error: {exc}") from exc

    # Convert the TimeSeries result to a frame; the available conversion
    # method varies, so probe the known method names in turn.
    try:
        if hasattr(forecast, "pd_dataframe"):
            forecast_frame = forecast.pd_dataframe().reset_index()
        elif hasattr(forecast, "to_dataframe"):
            forecast_frame = forecast.to_dataframe().reset_index()
        elif hasattr(forecast, "pd_series"):
            forecast_frame = forecast.pd_series().to_frame(name=dataset.target_col).reset_index()
        else:
            raise AttributeError("No supported dataframe conversion method was found on the DARTS TimeSeries result.")
    except Exception as exc:  # pragma: no cover - environment dependent
        raise ValueError(
            f"Model '{model_name}' produced a forecast, but tscli could not convert it to a table. "
            f"Original error: {exc}"
        ) from exc

    # Normalize column names to the dataset's time/target names.
    # NOTE(review): assumes the converted frame has exactly two columns.
    forecast_frame.columns = [dataset.time_col, dataset.target_col]
    return forecast_frame
|
|
291
|
+
|
|
292
|
+
|
|
293
|
+
def _statsmodels_fallback_forecast(
    dataset: LoadedSeries,
    model_name: str,
    horizon: int,
    seasonal_period: int,
) -> pd.DataFrame:
    """Forecast with statsmodels when the DARTS (s)arima models are unavailable.

    "arima" uses ARIMA(1,1,1); anything else (i.e. "sarima") uses SARIMAX
    with a seasonal order. Returns a two-column (time, target) frame.

    NOTE(review): this duplicates the fitting logic of
    _statsmodels_classical_forecast, differing only in the error message —
    consider delegating to it.
    """
    frame = dataset.frame[[dataset.time_col, dataset.target_col]].dropna().copy()
    history = frame[dataset.target_col].astype(float).to_numpy()

    try:
        if model_name == "arima":
            fitted = StatsmodelsARIMA(history, order=(1, 1, 1)).fit()
        else:
            # Use a lighter seasonal order when the history is too short for
            # a full seasonal parameterization.
            seasonal_order = (1, 1, 1, seasonal_period)
            if len(history) < max(24, seasonal_period * 2 + 6):
                seasonal_order = (0, 1, 1, seasonal_period)
            fitted = SARIMAX(
                history,
                order=(1, 1, 1),
                seasonal_order=seasonal_order,
                enforce_stationarity=False,
                enforce_invertibility=False,
            ).fit(disp=False)
        forecast_values = np.asarray(fitted.forecast(steps=horizon), dtype=float)
    except Exception as exc:
        raise ValueError(
            f"Model '{model_name}' is unavailable through DARTS and the fallback implementation also failed. "
            f"Original error: {exc}"
        ) from exc

    return pd.DataFrame(
        {
            dataset.time_col: _future_index(frame, dataset.time_col, horizon),
            dataset.target_col: forecast_values,
        }
    )
|
|
329
|
+
|
|
330
|
+
|
|
331
|
+
def _statsmodels_classical_forecast(
    dataset: LoadedSeries,
    model_name: str,
    horizon: int,
    seasonal_period: int,
) -> pd.DataFrame:
    """Fit a statsmodels ARIMA/SARIMAX on the target and forecast *horizon* steps.

    "arima" uses ARIMA(1,1,1); any other name uses SARIMAX with a seasonal
    order. Returns a two-column (time, target) frame.
    """
    pair = dataset.frame[[dataset.time_col, dataset.target_col]].dropna().copy()
    observed = pair[dataset.target_col].astype(float).to_numpy()

    try:
        if model_name == "arima":
            fitted = StatsmodelsARIMA(observed, order=(1, 1, 1)).fit()
        else:
            # Small datasets often cannot support a full seasonal parameterization.
            rich_enough = len(observed) >= max(24, seasonal_period * 2 + 6)
            seasonal_order = (1, 1, 1, seasonal_period) if rich_enough else (0, 1, 1, seasonal_period)
            fitted = SARIMAX(
                observed,
                order=(1, 1, 1),
                seasonal_order=seasonal_order,
                enforce_stationarity=False,
                enforce_invertibility=False,
            ).fit(disp=False)
        predicted = np.asarray(fitted.forecast(steps=horizon), dtype=float)
    except Exception as exc:
        raise ValueError(f"Model '{model_name}' failed to fit or predict. Original error: {exc}") from exc

    return pd.DataFrame(
        {
            dataset.time_col: _future_index(pair, dataset.time_col, horizon),
            dataset.target_col: predicted,
        }
    )
|
|
366
|
+
|
|
367
|
+
|
|
368
|
+
def generate_forecast(
    dataset: LoadedSeries,
    model_name: str,
    horizon: int,
    seasonal_period: int = 12,
) -> ForecastResult:
    """Forecast *horizon* future target values with *model_name*.

    Built-in heuristics run directly on the observed values; DARTS-backed
    classical models are loaded on demand, with a statsmodels fallback for
    (s)arima when DARTS itself is not installed.

    Raises:
        ValueError: for unknown model names or when the model fails.
    """
    if model_name not in SUPPORTED_MODELS:
        allowed = ", ".join(sorted(SUPPORTED_MODELS))
        raise ValueError(f"Unsupported model '{model_name}'. Choose from: {allowed}.")

    observed = dataset.frame[[dataset.time_col, dataset.target_col]].dropna().copy()

    if MODEL_SPECS[model_name].family == "built-in":
        history = build_series(dataset).values(copy=False).reshape(-1)
        predicted = _heuristic_forecast_values(history, model_name, horizon, seasonal_period)
        forecast_frame = pd.DataFrame(
            {
                dataset.time_col: _future_index(observed, dataset.time_col, horizon),
                dataset.target_col: predicted,
            }
        )
        return ForecastResult(model_name=model_name, forecast_frame=forecast_frame)

    try:
        forecast_frame = _darts_classical_forecast(dataset, model_name, horizon, seasonal_period)
    except ValueError as exc:
        # Only the (s)arima models have a statsmodels fallback, and only
        # when the failure was a missing DARTS installation.
        if model_name in {"arima", "sarima"} and "unavailable in this environment" in str(exc):
            forecast_frame = _statsmodels_fallback_forecast(dataset, model_name, horizon, seasonal_period)
        else:
            raise
    return ForecastResult(model_name=model_name, forecast_frame=forecast_frame)
|
|
401
|
+
|
|
402
|
+
|
|
403
|
+
def evaluate_forecast(actual: np.ndarray, predicted: np.ndarray, model_name: str) -> EvaluationResult:
    """Score *predicted* against *actual* with MAE, RMSE, and MAPE (percent).

    MAPE is computed over non-zero actuals only, and is NaN when every
    actual value is zero.
    """
    actual = actual.astype(float)
    predicted = predicted.astype(float)
    residuals = actual - predicted

    mae = float(np.abs(residuals).mean())
    rmse = float(np.sqrt(np.square(residuals).mean()))

    usable = actual != 0
    if usable.any():
        mape = float(np.abs(residuals[usable] / actual[usable]).mean() * 100)
    else:
        mape = float("nan")

    return EvaluationResult(model_name=model_name, mae=mae, rmse=rmse, mape=mape)
|
|
417
|
+
|
|
418
|
+
|
|
419
|
+
def benchmark_models(
    dataset: LoadedSeries,
    model_names: list[str],
    horizon: int,
    seasonal_period: int = 12,
) -> BenchmarkResult:
    """Back-test each named model on the last *horizon* observations.

    The cleaned series is split into a training portion (all but the last
    *horizon* rows) and a holdout; each model forecasts the holdout and is
    scored with evaluate_forecast. Models that raise are recorded in
    skipped_models instead of aborting the run.

    Raises:
        ValueError: if there are not enough rows, or no model succeeds.
    """
    clean_frame = dataset.frame[[dataset.time_col, dataset.target_col]].dropna().reset_index(drop=True)
    if len(clean_frame) <= horizon:
        raise ValueError(
            f"Need more than {horizon} observations to benchmark models, but found {len(clean_frame)}."
        )

    # Train/holdout split: the final `horizon` rows are the evaluation target.
    train_frame = clean_frame.iloc[:-horizon].copy()
    actual_frame = clean_frame.iloc[-horizon:].copy().reset_index(drop=True)
    train_dataset = _dataset_from_frame(dataset, train_frame)

    scores: list[EvaluationResult] = []
    forecasts: dict[str, pd.DataFrame] = {}
    skipped_models: dict[str, str] = {}
    for model_name in tqdm(model_names, desc="Benchmarking models", unit="model"):
        try:
            result = generate_forecast(
                train_dataset,
                model_name=model_name,
                horizon=horizon,
                seasonal_period=seasonal_period,
            )
            predicted = result.forecast_frame[dataset.target_col].to_numpy(dtype=float)
            actual = actual_frame[dataset.target_col].to_numpy(dtype=float)
            scores.append(evaluate_forecast(actual, predicted, model_name))
            forecasts[model_name] = result.forecast_frame
        except Exception as exc:
            # A failing model must not abort the whole benchmark; keep the
            # reason so the caller can report it.
            skipped_models[model_name] = str(exc)

    if not scores:
        raise ValueError("No models could be benchmarked successfully with the current data and settings.")

    # Rank by RMSE, breaking ties with MAE and then the model name.
    scores.sort(key=lambda item: (item.rmse, item.mae, item.model_name))
    return BenchmarkResult(
        scores=scores,
        actual_frame=actual_frame,
        forecasts=forecasts,
        best_model=scores[0].model_name,
        skipped_models=skipped_models,
    )
|
|
464
|
+
|
|
465
|
+
|
|
466
|
+
def export_frame(frame: pd.DataFrame, output_path: Path, time_col: str) -> None:
    """Write *frame* to *output_path* as CSV, creating parent directories."""
    output_path.parent.mkdir(parents=True, exist_ok=True)
    _coerce_output_frame(frame, time_col).to_csv(output_path, index=False)
|
|
470
|
+
|
|
471
|
+
|
|
472
|
+
def export_scores(scores: list[EvaluationResult], output_path: Path) -> None:
    """Write benchmark *scores* to *output_path* as a model/mae/rmse/mape CSV."""
    output_path.parent.mkdir(parents=True, exist_ok=True)
    rows = [
        {
            "model": score.model_name,
            "mae": score.mae,
            "rmse": score.rmse,
            "mape": score.mape,
        }
        for score in scores
    ]
    pd.DataFrame(rows).to_csv(output_path, index=False)
|
|
486
|
+
|
|
487
|
+
|
|
488
|
+
def export_forecast_plot(
    history_frame: pd.DataFrame,
    forecast_frame: pd.DataFrame,
    time_col: str,
    target_col: str,
    output_path: Path,
    model_name: str,
) -> None:
    """Save a plot of the history plus the model's forecast to *output_path*."""
    output_path.parent.mkdir(parents=True, exist_ok=True)
    fig, ax = plt.subplots(figsize=(10, 5))
    ax.plot(history_frame[time_col], history_frame[target_col], label="history", linewidth=2)
    ax.plot(forecast_frame[time_col], forecast_frame[target_col], label=f"forecast ({model_name})", linewidth=2)
    ax.set_title(f"Forecast - {model_name}")
    ax.set_xlabel(time_col)
    ax.set_ylabel(target_col)
    ax.legend()
    ax.grid(alpha=0.3)
    # Slant x tick labels so datetime axes stay readable.
    fig.autofmt_xdate()
    fig.tight_layout()
    fig.savefig(output_path, dpi=160)
    # Close explicitly so repeated calls do not accumulate open figures.
    plt.close(fig)
|
|
509
|
+
|
|
510
|
+
|
|
511
|
+
def export_benchmark_plot(
    actual_frame: pd.DataFrame,
    forecast_frame: pd.DataFrame,
    time_col: str,
    target_col: str,
    output_path: Path,
    model_name: str,
) -> None:
    """Save a plot comparing the holdout actuals to a model's predictions."""
    output_path.parent.mkdir(parents=True, exist_ok=True)
    fig, ax = plt.subplots(figsize=(10, 5))
    ax.plot(actual_frame[time_col], actual_frame[target_col], label="actual", linewidth=2)
    ax.plot(forecast_frame[time_col], forecast_frame[target_col], label=f"predicted ({model_name})", linewidth=2)
    ax.set_title(f"Benchmark Holdout - {model_name}")
    ax.set_xlabel(time_col)
    ax.set_ylabel(target_col)
    ax.legend()
    ax.grid(alpha=0.3)
    # Slant x tick labels so datetime axes stay readable.
    fig.autofmt_xdate()
    fig.tight_layout()
    fig.savefig(output_path, dpi=160)
    # Close explicitly so repeated calls do not accumulate open figures.
    plt.close(fig)