PyPI - ml4t-diagnostic - Versions diffs - 0.1.0a1__py3-none-any.whl - Mend

ml4t-diagnostic 0.1.0a1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (242) hide show

ml4t/diagnostic/AGENT.md +25 -0
ml4t/diagnostic/__init__.py +166 -0
ml4t/diagnostic/backends/__init__.py +10 -0
ml4t/diagnostic/backends/adapter.py +192 -0
ml4t/diagnostic/backends/polars_backend.py +899 -0
ml4t/diagnostic/caching/__init__.py +40 -0
ml4t/diagnostic/caching/cache.py +331 -0
ml4t/diagnostic/caching/decorators.py +131 -0
ml4t/diagnostic/caching/smart_cache.py +339 -0
ml4t/diagnostic/config/AGENT.md +24 -0
ml4t/diagnostic/config/README.md +267 -0
ml4t/diagnostic/config/__init__.py +219 -0
ml4t/diagnostic/config/barrier_config.py +277 -0
ml4t/diagnostic/config/base.py +301 -0
ml4t/diagnostic/config/event_config.py +148 -0
ml4t/diagnostic/config/feature_config.py +404 -0
ml4t/diagnostic/config/multi_signal_config.py +55 -0
ml4t/diagnostic/config/portfolio_config.py +215 -0
ml4t/diagnostic/config/report_config.py +391 -0
ml4t/diagnostic/config/sharpe_config.py +202 -0
ml4t/diagnostic/config/signal_config.py +206 -0
ml4t/diagnostic/config/trade_analysis_config.py +310 -0
ml4t/diagnostic/config/validation.py +279 -0
ml4t/diagnostic/core/__init__.py +29 -0
ml4t/diagnostic/core/numba_utils.py +315 -0
ml4t/diagnostic/core/purging.py +372 -0
ml4t/diagnostic/core/sampling.py +471 -0
ml4t/diagnostic/errors/__init__.py +205 -0
ml4t/diagnostic/evaluation/AGENT.md +26 -0
ml4t/diagnostic/evaluation/__init__.py +437 -0
ml4t/diagnostic/evaluation/autocorrelation.py +531 -0
ml4t/diagnostic/evaluation/barrier_analysis.py +1050 -0
ml4t/diagnostic/evaluation/binary_metrics.py +910 -0
ml4t/diagnostic/evaluation/dashboard.py +715 -0
ml4t/diagnostic/evaluation/diagnostic_plots.py +1037 -0
ml4t/diagnostic/evaluation/distribution/__init__.py +499 -0
ml4t/diagnostic/evaluation/distribution/moments.py +299 -0
ml4t/diagnostic/evaluation/distribution/tails.py +777 -0
ml4t/diagnostic/evaluation/distribution/tests.py +470 -0
ml4t/diagnostic/evaluation/drift/__init__.py +139 -0
ml4t/diagnostic/evaluation/drift/analysis.py +432 -0
ml4t/diagnostic/evaluation/drift/domain_classifier.py +517 -0
ml4t/diagnostic/evaluation/drift/population_stability_index.py +310 -0
ml4t/diagnostic/evaluation/drift/wasserstein.py +388 -0
ml4t/diagnostic/evaluation/event_analysis.py +647 -0
ml4t/diagnostic/evaluation/excursion.py +390 -0
ml4t/diagnostic/evaluation/feature_diagnostics.py +873 -0
ml4t/diagnostic/evaluation/feature_outcome.py +666 -0
ml4t/diagnostic/evaluation/framework.py +935 -0
ml4t/diagnostic/evaluation/metric_registry.py +255 -0
ml4t/diagnostic/evaluation/metrics/AGENT.md +23 -0
ml4t/diagnostic/evaluation/metrics/__init__.py +133 -0
ml4t/diagnostic/evaluation/metrics/basic.py +160 -0
ml4t/diagnostic/evaluation/metrics/conditional_ic.py +469 -0
ml4t/diagnostic/evaluation/metrics/feature_outcome.py +475 -0
ml4t/diagnostic/evaluation/metrics/ic_statistics.py +446 -0
ml4t/diagnostic/evaluation/metrics/importance_analysis.py +338 -0
ml4t/diagnostic/evaluation/metrics/importance_classical.py +375 -0
ml4t/diagnostic/evaluation/metrics/importance_mda.py +371 -0
ml4t/diagnostic/evaluation/metrics/importance_shap.py +715 -0
ml4t/diagnostic/evaluation/metrics/information_coefficient.py +527 -0
ml4t/diagnostic/evaluation/metrics/interactions.py +772 -0
ml4t/diagnostic/evaluation/metrics/monotonicity.py +226 -0
ml4t/diagnostic/evaluation/metrics/risk_adjusted.py +324 -0
ml4t/diagnostic/evaluation/multi_signal.py +550 -0
ml4t/diagnostic/evaluation/portfolio_analysis/__init__.py +83 -0
ml4t/diagnostic/evaluation/portfolio_analysis/analysis.py +734 -0
ml4t/diagnostic/evaluation/portfolio_analysis/metrics.py +589 -0
ml4t/diagnostic/evaluation/portfolio_analysis/results.py +334 -0
ml4t/diagnostic/evaluation/report_generation.py +824 -0
ml4t/diagnostic/evaluation/signal_selector.py +452 -0
ml4t/diagnostic/evaluation/stat_registry.py +139 -0
ml4t/diagnostic/evaluation/stationarity/__init__.py +97 -0
ml4t/diagnostic/evaluation/stationarity/analysis.py +518 -0
ml4t/diagnostic/evaluation/stationarity/augmented_dickey_fuller.py +296 -0
ml4t/diagnostic/evaluation/stationarity/kpss_test.py +308 -0
ml4t/diagnostic/evaluation/stationarity/phillips_perron.py +365 -0
ml4t/diagnostic/evaluation/stats/AGENT.md +43 -0
ml4t/diagnostic/evaluation/stats/__init__.py +191 -0
ml4t/diagnostic/evaluation/stats/backtest_overfitting.py +219 -0
ml4t/diagnostic/evaluation/stats/bootstrap.py +228 -0
ml4t/diagnostic/evaluation/stats/deflated_sharpe_ratio.py +591 -0
ml4t/diagnostic/evaluation/stats/false_discovery_rate.py +295 -0
ml4t/diagnostic/evaluation/stats/hac_standard_errors.py +108 -0
ml4t/diagnostic/evaluation/stats/minimum_track_record.py +408 -0
ml4t/diagnostic/evaluation/stats/moments.py +164 -0
ml4t/diagnostic/evaluation/stats/rademacher_adjustment.py +436 -0
ml4t/diagnostic/evaluation/stats/reality_check.py +155 -0
ml4t/diagnostic/evaluation/stats/sharpe_inference.py +219 -0
ml4t/diagnostic/evaluation/themes.py +330 -0
ml4t/diagnostic/evaluation/threshold_analysis.py +957 -0
ml4t/diagnostic/evaluation/trade_analysis.py +1136 -0
ml4t/diagnostic/evaluation/trade_dashboard/__init__.py +32 -0
ml4t/diagnostic/evaluation/trade_dashboard/app.py +315 -0
ml4t/diagnostic/evaluation/trade_dashboard/export/__init__.py +18 -0
ml4t/diagnostic/evaluation/trade_dashboard/export/csv.py +82 -0
ml4t/diagnostic/evaluation/trade_dashboard/export/html.py +276 -0
ml4t/diagnostic/evaluation/trade_dashboard/io.py +166 -0
ml4t/diagnostic/evaluation/trade_dashboard/normalize.py +304 -0
ml4t/diagnostic/evaluation/trade_dashboard/stats.py +386 -0
ml4t/diagnostic/evaluation/trade_dashboard/style.py +79 -0
ml4t/diagnostic/evaluation/trade_dashboard/tabs/__init__.py +21 -0
ml4t/diagnostic/evaluation/trade_dashboard/tabs/patterns.py +354 -0
ml4t/diagnostic/evaluation/trade_dashboard/tabs/shap_analysis.py +280 -0
ml4t/diagnostic/evaluation/trade_dashboard/tabs/stat_validation.py +186 -0
ml4t/diagnostic/evaluation/trade_dashboard/tabs/worst_trades.py +236 -0
ml4t/diagnostic/evaluation/trade_dashboard/types.py +129 -0
ml4t/diagnostic/evaluation/trade_shap/__init__.py +102 -0
ml4t/diagnostic/evaluation/trade_shap/alignment.py +188 -0
ml4t/diagnostic/evaluation/trade_shap/characterize.py +413 -0
ml4t/diagnostic/evaluation/trade_shap/cluster.py +302 -0
ml4t/diagnostic/evaluation/trade_shap/explain.py +208 -0
ml4t/diagnostic/evaluation/trade_shap/hypotheses/__init__.py +23 -0
ml4t/diagnostic/evaluation/trade_shap/hypotheses/generator.py +290 -0
ml4t/diagnostic/evaluation/trade_shap/hypotheses/matcher.py +251 -0
ml4t/diagnostic/evaluation/trade_shap/hypotheses/templates.yaml +467 -0
ml4t/diagnostic/evaluation/trade_shap/models.py +386 -0
ml4t/diagnostic/evaluation/trade_shap/normalize.py +116 -0
ml4t/diagnostic/evaluation/trade_shap/pipeline.py +263 -0
ml4t/diagnostic/evaluation/trade_shap_dashboard.py +283 -0
ml4t/diagnostic/evaluation/trade_shap_diagnostics.py +588 -0
ml4t/diagnostic/evaluation/validated_cv.py +535 -0
ml4t/diagnostic/evaluation/visualization.py +1050 -0
ml4t/diagnostic/evaluation/volatility/__init__.py +45 -0
ml4t/diagnostic/evaluation/volatility/analysis.py +351 -0
ml4t/diagnostic/evaluation/volatility/arch.py +258 -0
ml4t/diagnostic/evaluation/volatility/garch.py +460 -0
ml4t/diagnostic/integration/__init__.py +48 -0
ml4t/diagnostic/integration/backtest_contract.py +671 -0
ml4t/diagnostic/integration/data_contract.py +316 -0
ml4t/diagnostic/integration/engineer_contract.py +226 -0
ml4t/diagnostic/logging/__init__.py +77 -0
ml4t/diagnostic/logging/logger.py +245 -0
ml4t/diagnostic/logging/performance.py +234 -0
ml4t/diagnostic/logging/progress.py +234 -0
ml4t/diagnostic/logging/wandb.py +412 -0
ml4t/diagnostic/metrics/__init__.py +9 -0
ml4t/diagnostic/metrics/percentiles.py +128 -0
ml4t/diagnostic/py.typed +1 -0
ml4t/diagnostic/reporting/__init__.py +43 -0
ml4t/diagnostic/reporting/base.py +130 -0
ml4t/diagnostic/reporting/html_renderer.py +275 -0
ml4t/diagnostic/reporting/json_renderer.py +51 -0
ml4t/diagnostic/reporting/markdown_renderer.py +117 -0
ml4t/diagnostic/results/AGENT.md +24 -0
ml4t/diagnostic/results/__init__.py +105 -0
ml4t/diagnostic/results/barrier_results/__init__.py +36 -0
ml4t/diagnostic/results/barrier_results/hit_rate.py +304 -0
ml4t/diagnostic/results/barrier_results/precision_recall.py +266 -0
ml4t/diagnostic/results/barrier_results/profit_factor.py +297 -0
ml4t/diagnostic/results/barrier_results/tearsheet.py +397 -0
ml4t/diagnostic/results/barrier_results/time_to_target.py +305 -0
ml4t/diagnostic/results/barrier_results/validation.py +38 -0
ml4t/diagnostic/results/base.py +177 -0
ml4t/diagnostic/results/event_results.py +349 -0
ml4t/diagnostic/results/feature_results.py +787 -0
ml4t/diagnostic/results/multi_signal_results.py +431 -0
ml4t/diagnostic/results/portfolio_results.py +281 -0
ml4t/diagnostic/results/sharpe_results.py +448 -0
ml4t/diagnostic/results/signal_results/__init__.py +74 -0
ml4t/diagnostic/results/signal_results/ic.py +581 -0
ml4t/diagnostic/results/signal_results/irtc.py +110 -0
ml4t/diagnostic/results/signal_results/quantile.py +392 -0
ml4t/diagnostic/results/signal_results/tearsheet.py +456 -0
ml4t/diagnostic/results/signal_results/turnover.py +213 -0
ml4t/diagnostic/results/signal_results/validation.py +147 -0
ml4t/diagnostic/signal/AGENT.md +17 -0
ml4t/diagnostic/signal/__init__.py +69 -0
ml4t/diagnostic/signal/_report.py +152 -0
ml4t/diagnostic/signal/_utils.py +261 -0
ml4t/diagnostic/signal/core.py +275 -0
ml4t/diagnostic/signal/quantile.py +148 -0
ml4t/diagnostic/signal/result.py +214 -0
ml4t/diagnostic/signal/signal_ic.py +129 -0
ml4t/diagnostic/signal/turnover.py +182 -0
ml4t/diagnostic/splitters/AGENT.md +19 -0
ml4t/diagnostic/splitters/__init__.py +36 -0
ml4t/diagnostic/splitters/base.py +501 -0
ml4t/diagnostic/splitters/calendar.py +421 -0
ml4t/diagnostic/splitters/calendar_config.py +91 -0
ml4t/diagnostic/splitters/combinatorial.py +1064 -0
ml4t/diagnostic/splitters/config.py +322 -0
ml4t/diagnostic/splitters/cpcv/__init__.py +57 -0
ml4t/diagnostic/splitters/cpcv/combinations.py +119 -0
ml4t/diagnostic/splitters/cpcv/partitioning.py +263 -0
ml4t/diagnostic/splitters/cpcv/purge_engine.py +379 -0
ml4t/diagnostic/splitters/cpcv/windows.py +190 -0
ml4t/diagnostic/splitters/group_isolation.py +329 -0
ml4t/diagnostic/splitters/persistence.py +316 -0
ml4t/diagnostic/splitters/utils.py +207 -0
ml4t/diagnostic/splitters/walk_forward.py +757 -0
ml4t/diagnostic/utils/__init__.py +42 -0
ml4t/diagnostic/utils/config.py +542 -0
ml4t/diagnostic/utils/dependencies.py +318 -0
ml4t/diagnostic/utils/sessions.py +127 -0
ml4t/diagnostic/validation/__init__.py +54 -0
ml4t/diagnostic/validation/dataframe.py +274 -0
ml4t/diagnostic/validation/returns.py +280 -0
ml4t/diagnostic/validation/timeseries.py +299 -0
ml4t/diagnostic/visualization/AGENT.md +19 -0
ml4t/diagnostic/visualization/__init__.py +223 -0
ml4t/diagnostic/visualization/backtest/__init__.py +98 -0
ml4t/diagnostic/visualization/backtest/cost_attribution.py +762 -0
ml4t/diagnostic/visualization/backtest/executive_summary.py +895 -0
ml4t/diagnostic/visualization/backtest/interactive_controls.py +673 -0
ml4t/diagnostic/visualization/backtest/statistical_validity.py +874 -0
ml4t/diagnostic/visualization/backtest/tearsheet.py +565 -0
ml4t/diagnostic/visualization/backtest/template_system.py +373 -0
ml4t/diagnostic/visualization/backtest/trade_plots.py +1172 -0
ml4t/diagnostic/visualization/barrier_plots.py +782 -0
ml4t/diagnostic/visualization/core.py +1060 -0
ml4t/diagnostic/visualization/dashboards/__init__.py +36 -0
ml4t/diagnostic/visualization/dashboards/base.py +582 -0
ml4t/diagnostic/visualization/dashboards/importance.py +801 -0
ml4t/diagnostic/visualization/dashboards/interaction.py +263 -0
ml4t/diagnostic/visualization/dashboards.py +43 -0
ml4t/diagnostic/visualization/data_extraction/__init__.py +48 -0
ml4t/diagnostic/visualization/data_extraction/importance.py +649 -0
ml4t/diagnostic/visualization/data_extraction/interaction.py +504 -0
ml4t/diagnostic/visualization/data_extraction/types.py +113 -0
ml4t/diagnostic/visualization/data_extraction/validation.py +66 -0
ml4t/diagnostic/visualization/feature_plots.py +888 -0
ml4t/diagnostic/visualization/interaction_plots.py +618 -0
ml4t/diagnostic/visualization/portfolio/__init__.py +41 -0
ml4t/diagnostic/visualization/portfolio/dashboard.py +514 -0
ml4t/diagnostic/visualization/portfolio/drawdown_plots.py +341 -0
ml4t/diagnostic/visualization/portfolio/returns_plots.py +487 -0
ml4t/diagnostic/visualization/portfolio/risk_plots.py +301 -0
ml4t/diagnostic/visualization/report_generation.py +1343 -0
ml4t/diagnostic/visualization/signal/__init__.py +103 -0
ml4t/diagnostic/visualization/signal/dashboard.py +911 -0
ml4t/diagnostic/visualization/signal/event_plots.py +514 -0
ml4t/diagnostic/visualization/signal/ic_plots.py +635 -0
ml4t/diagnostic/visualization/signal/multi_signal_dashboard.py +974 -0
ml4t/diagnostic/visualization/signal/multi_signal_plots.py +603 -0
ml4t/diagnostic/visualization/signal/quantile_plots.py +625 -0
ml4t/diagnostic/visualization/signal/turnover_plots.py +400 -0
ml4t/diagnostic/visualization/trade_shap/__init__.py +90 -0
ml4t_diagnostic-0.1.0a1.dist-info/METADATA +1044 -0
ml4t_diagnostic-0.1.0a1.dist-info/RECORD +242 -0
ml4t_diagnostic-0.1.0a1.dist-info/WHEEL +4 -0
ml4t_diagnostic-0.1.0a1.dist-info/licenses/LICENSE +21 -0

ml4t/diagnostic/visualization/backtest/statistical_validity.py ADDED Viewed

@@ -0,0 +1,874 @@
+"""Statistical validity visualizations for backtest analysis.
+Provides interactive Plotly visualizations for statistical rigor:
+- DSR (Deflated Sharpe Ratio) gauge with probability zones
+- Confidence interval forest plots
+- RAS (Rademacher Anti-Serum) overfitting detection
+- MinTRL (Minimum Track Record Length) analysis
+These visualizations help traders understand whether their backtest results
+are statistically significant or likely due to overfitting/chance.
+"""
+from __future__ import annotations
+from typing import TYPE_CHECKING, Any, Literal
+import numpy as np
+import plotly.graph_objects as go
+from ml4t.diagnostic.visualization.core import get_theme_config
+if TYPE_CHECKING:
+    pass
+def plot_dsr_gauge(
+    dsr_probability: float,
+    observed_sharpe: float,
+    expected_max_sharpe: float | None = None,
+    n_trials: int | None = None,
+    title: str = "Deflated Sharpe Ratio",
+    show_legend: bool = True,
+    theme: str | None = None,
+    height: int = 350,
+    width: int = 500,
+) -> go.Figure:
+    """Create a gauge chart showing DSR probability.
+    The Deflated Sharpe Ratio corrects for selection bias when choosing
+    the best strategy from multiple tests. A DSR probability < 0.05
+    suggests the performance is statistically significant.
+    Parameters
+    ----------
+    dsr_probability : float
+        DSR probability value (0-1), where lower is more significant.
+        Typically displayed as 1 - dsr for "confidence" interpretation.
+    observed_sharpe : float
+        The observed Sharpe ratio being tested
+    expected_max_sharpe : float, optional
+        The expected maximum Sharpe under null hypothesis
+    n_trials : int, optional
+        Number of trials/strategies tested (for annotation)
+    title : str
+        Chart title
+    show_legend : bool
+        Whether to show the color zone legend
+    theme : str, optional
+        Theme name (default, dark, print, presentation)
+    height : int
+        Figure height in pixels
+    width : int
+        Figure width in pixels
+    Returns
+    -------
+    go.Figure
+        Plotly figure with gauge chart
+    Examples
+    --------
+    >>> fig = plot_dsr_gauge(
+    ...     dsr_probability=0.03,
+    ...     observed_sharpe=2.1,
+    ...     n_trials=100,
+    ... )
+    >>> fig.show()
+    """
+    theme_config = get_theme_config(theme)
+    # Convert to "confidence" (1 - p-value style)
+    # High confidence = good, Low confidence = bad
+    confidence = (1 - dsr_probability) * 100
+    # Color zones: Red (not significant) -> Yellow (marginal) -> Green (significant)
+    # Standard thresholds: p < 0.05 (95%), p < 0.01 (99%)
+    fig = go.Figure(
+        go.Indicator(
+            mode="gauge+number",
+            value=confidence,
+            number={"suffix": "%", "font": {"size": 36}},
+            title={"text": title, "font": {"size": 18}},
+            gauge={
+                "axis": {
+                    "range": [0, 100],
+                    "tickwidth": 1,
+                    "tickcolor": "darkgray",
+                    "tickvals": [0, 50, 90, 95, 99, 100],
+                    "ticktext": ["0%", "50%", "90%", "95%", "99%", "100%"],
+                },
+                "bar": {"color": "darkblue"},
+                "bgcolor": "white",
+                "borderwidth": 2,
+                "bordercolor": "gray",
+                "steps": [
+                    {"range": [0, 50], "color": "#EF553B"},  # Red - not significant
+                    {"range": [50, 90], "color": "#FFA15A"},  # Orange - weak
+                    {"range": [90, 95], "color": "#FECB52"},  # Yellow - marginal
+                    {"range": [95, 99], "color": "#00CC96"},  # Green - significant
+                    {"range": [99, 100], "color": "#19D3F3"},  # Cyan - highly significant
+                ],
+                "threshold": {
+                    "line": {"color": "black", "width": 4},
+                    "thickness": 0.75,
+                    "value": confidence,
+                },
+            },
+        )
+    )
+    # Add annotations
+    annotations = []
+    # DSR probability annotation
+    annotations.append(
+        {
+            "x": 0.5,
+            "y": 0.25,
+            "text": f"DSR p-value: {dsr_probability:.4f}",
+            "showarrow": False,
+            "font": {"size": 14},
+            "xref": "paper",
+            "yref": "paper",
+        }
+    )
+    # Observed Sharpe
+    annotations.append(
+        {
+            "x": 0.5,
+            "y": 0.15,
+            "text": f"Observed Sharpe: {observed_sharpe:.2f}",
+            "showarrow": False,
+            "font": {"size": 12},
+            "xref": "paper",
+            "yref": "paper",
+        }
+    )
+    # Expected max Sharpe if provided
+    if expected_max_sharpe is not None:
+        annotations.append(
+            {
+                "x": 0.5,
+                "y": 0.08,
+                "text": f"E[max SR]: {expected_max_sharpe:.2f}",
+                "showarrow": False,
+                "font": {"size": 12},
+                "xref": "paper",
+                "yref": "paper",
+            }
+        )
+    # Number of trials
+    if n_trials is not None:
+        annotations.append(
+            {
+                "x": 0.5,
+                "y": 0.01,
+                "text": f"(N={n_trials} trials)",
+                "showarrow": False,
+                "font": {"size": 11, "color": "gray"},
+                "xref": "paper",
+                "yref": "paper",
+            }
+        )
+    # Build layout
+    layout_updates = {
+        "height": height,
+        "width": width,
+        "annotations": annotations,
+        "margin": {"l": 40, "r": 40, "t": 60, "b": 40},
+    }
+    for key, value in theme_config["layout"].items():
+        if key not in layout_updates:
+            layout_updates[key] = value
+    fig.update_layout(**layout_updates)
+    return fig
+def plot_confidence_intervals(
+    metrics: dict[str, dict[str, float]],
+    confidence_levels: list[float] | None = None,
+    title: str = "Metric Confidence Intervals",
+    orientation: Literal["h", "v"] = "h",
+    show_point_estimate: bool = True,
+    theme: str | None = None,
+    height: int = 400,
+    width: int | None = None,
+) -> go.Figure:
+    """Create a forest plot showing confidence intervals for multiple metrics.
+    Visualizes bootstrap or analytical confidence intervals at multiple
+    confidence levels (e.g., 90%, 95%, 99%).
+    Parameters
+    ----------
+    metrics : dict[str, dict[str, float]]
+        Dictionary mapping metric names to their CI values.
+        Each value should have keys: 'point', 'lower_90', 'upper_90',
+        'lower_95', 'upper_95', 'lower_99', 'upper_99' (based on levels).
+    confidence_levels : list[float], optional
+        Confidence levels to display (default: [0.90, 0.95, 0.99])
+    title : str
+        Chart title
+    orientation : {"h", "v"}
+        Horizontal or vertical orientation
+    show_point_estimate : bool
+        Whether to show the point estimate marker
+    theme : str, optional
+        Theme name
+    height : int
+        Figure height in pixels
+    width : int, optional
+        Figure width in pixels
+    Returns
+    -------
+    go.Figure
+        Plotly figure with forest plot
+    Examples
+    --------
+    >>> metrics = {
+    ...     "Sharpe": {"point": 1.5, "lower_95": 0.8, "upper_95": 2.2},
+    ...     "CAGR": {"point": 0.15, "lower_95": 0.08, "upper_95": 0.22},
+    ... }
+    >>> fig = plot_confidence_intervals(metrics)
+    >>> fig.show()
+    """
+    theme_config = get_theme_config(theme)
+    colors = theme_config["colorway"]
+    if confidence_levels is None:
+        confidence_levels = [0.90, 0.95, 0.99]
+    # Sort confidence levels (widest first for plotting)
+    confidence_levels = sorted(confidence_levels, reverse=True)
+    fig = go.Figure()
+    metric_names = list(metrics.keys())
+    n_metrics = len(metric_names)
+    # Colors for different confidence levels (lighter to darker)
+    level_colors = {
+        0.99: "rgba(99, 110, 250, 0.3)",  # Lightest - widest CI
+        0.95: "rgba(99, 110, 250, 0.5)",
+        0.90: "rgba(99, 110, 250, 0.7)",  # Darkest - narrowest CI
+    }
+    for i, metric_name in enumerate(metric_names):
+        metric_data = metrics[metric_name]
+        point = metric_data.get("point", metric_data.get("estimate", 0))
+        # Plot confidence intervals from widest to narrowest
+        for level in confidence_levels:
+            level_pct = int(level * 100)
+            lower_key = f"lower_{level_pct}"
+            upper_key = f"upper_{level_pct}"
+            if lower_key in metric_data and upper_key in metric_data:
+                lower = metric_data[lower_key]
+                upper = metric_data[upper_key]
+                color = level_colors.get(level, "rgba(99, 110, 250, 0.5)")
+                if orientation == "h":
+                    fig.add_trace(
+                        go.Scatter(
+                            x=[lower, upper],
+                            y=[i, i],
+                            mode="lines",
+                            line={"color": color, "width": 8 if level == 0.95 else 5},
+                            name=f"{level_pct}% CI" if i == 0 else None,
+                            showlegend=(i == 0),
+                            hovertemplate=f"{metric_name}<br>{level_pct}% CI: [{lower:.3f}, {upper:.3f}]<extra></extra>",
+                        )
+                    )
+                else:
+                    fig.add_trace(
+                        go.Scatter(
+                            x=[i, i],
+                            y=[lower, upper],
+                            mode="lines",
+                            line={"color": color, "width": 8 if level == 0.95 else 5},
+                            name=f"{level_pct}% CI" if i == 0 else None,
+                            showlegend=(i == 0),
+                            hovertemplate=f"{metric_name}<br>{level_pct}% CI: [{lower:.3f}, {upper:.3f}]<extra></extra>",
+                        )
+                    )
+        # Add point estimate
+        if show_point_estimate:
+            if orientation == "h":
+                fig.add_trace(
+                    go.Scatter(
+                        x=[point],
+                        y=[i],
+                        mode="markers",
+                        marker={"color": colors[0], "size": 12, "symbol": "diamond"},
+                        name="Point Estimate" if i == 0 else None,
+                        showlegend=(i == 0),
+                        hovertemplate=f"{metric_name}: {point:.3f}<extra></extra>",
+                    )
+                )
+            else:
+                fig.add_trace(
+                    go.Scatter(
+                        x=[i],
+                        y=[point],
+                        mode="markers",
+                        marker={"color": colors[0], "size": 12, "symbol": "diamond"},
+                        name="Point Estimate" if i == 0 else None,
+                        showlegend=(i == 0),
+                        hovertemplate=f"{metric_name}: {point:.3f}<extra></extra>",
+                    )
+                )
+    # Add zero reference line for Sharpe-like metrics
+    if orientation == "h":
+        fig.add_vline(x=0, line_dash="dash", line_color="gray", line_width=1)
+    else:
+        fig.add_hline(y=0, line_dash="dash", line_color="gray", line_width=1)
+    # Build layout
+    if orientation == "h":
+        layout_updates = {
+            "title": {"text": title, "font": {"size": 18}},
+            "height": max(height, n_metrics * 60 + 100),
+            "xaxis": {"title": "Value", "zeroline": True},
+            "yaxis": {
+                "tickvals": list(range(n_metrics)),
+                "ticktext": metric_names,
+                "autorange": "reversed",
+            },
+            "legend": {"yanchor": "top", "y": 0.99, "xanchor": "right", "x": 0.99},
+        }
+    else:
+        layout_updates = {
+            "title": {"text": title, "font": {"size": 18}},
+            "height": height,
+            "yaxis": {"title": "Value", "zeroline": True},
+            "xaxis": {
+                "tickvals": list(range(n_metrics)),
+                "ticktext": metric_names,
+            },
+            "legend": {"yanchor": "top", "y": 0.99, "xanchor": "right", "x": 0.99},
+        }
+    if width:
+        layout_updates["width"] = width
+    for key, value in theme_config["layout"].items():
+        if key not in layout_updates:
+            layout_updates[key] = value
+    fig.update_layout(**layout_updates)
+    return fig
+def plot_ras_analysis(
+    original_ic: float,
+    adjusted_ic: float,
+    rademacher_complexity: float,
+    kappa: float = 0.02,
+    n_features: int | None = None,
+    n_observations: int | None = None,
+    title: str = "Rademacher Anti-Serum Analysis",
+    theme: str | None = None,
+    height: int = 400,
+    width: int = 600,
+) -> go.Figure:
+    """Visualize Rademacher Anti-Serum (RAS) overfitting adjustment.
+    The RAS method adjusts Information Coefficients for data mining bias
+    by estimating the Rademacher complexity of the strategy search space.
+    Parameters
+    ----------
+    original_ic : float
+        Original (unadjusted) Information Coefficient
+    adjusted_ic : float
+        RAS-adjusted Information Coefficient
+    rademacher_complexity : float
+        Estimated Rademacher complexity R̂
+    kappa : float
+        The practical bound parameter used (default: 0.02)
+    n_features : int, optional
+        Number of features/strategies tested
+    n_observations : int, optional
+        Number of observations
+    title : str
+        Chart title
+    theme : str, optional
+        Theme name
+    height : int
+        Figure height in pixels
+    width : int
+        Figure width in pixels
+    Returns
+    -------
+    go.Figure
+        Plotly figure with RAS analysis
+    Notes
+    -----
+    The RAS adjustment is:
+    IC_adj = max(0, IC_original - 2 * (R̂ + κ))
+    where R̂ is the Rademacher complexity and κ is a practical bound.
+    """
+    theme_config = get_theme_config(theme)
+    colors = theme_config["colorway"]
+    # Calculate the haircut percentage
+    haircut_pct = (1 - adjusted_ic / original_ic) * 100 if original_ic != 0 else 100
+    # Create waterfall chart
+    fig = go.Figure()
+    categories = ["Original IC", "Rademacher (2R̂)", "Practical κ", "Adjusted IC"]
+    values = [original_ic, -2 * rademacher_complexity, -2 * kappa, adjusted_ic]
+    measures = ["absolute", "relative", "relative", "total"]
+    fig.add_trace(
+        go.Waterfall(
+            name="RAS Adjustment",
+            orientation="v",
+            x=categories,
+            y=values,
+            measure=measures,
+            text=[f"{v:.4f}" for v in values],
+            textposition="outside",
+            decreasing={"marker": {"color": "#EF553B"}},
+            increasing={"marker": {"color": colors[0]}},
+            totals={"marker": {"color": "#00CC96" if adjusted_ic > 0 else "#EF553B"}},
+            connector={"line": {"color": "rgba(128, 128, 128, 0.5)", "width": 2}},
+        )
+    )
+    # Add annotations
+    annotations = []
+    # Haircut percentage
+    annotations.append(
+        {
+            "x": 0.5,
+            "y": -0.15,
+            "text": f"IC Haircut: {haircut_pct:.1f}%  |  R̂ = {rademacher_complexity:.4f}  |  κ = {kappa:.4f}",
+            "showarrow": False,
+            "font": {"size": 12},
+            "xref": "paper",
+            "yref": "paper",
+        }
+    )
+    # Significance indicator
+    if adjusted_ic > 0:
+        sig_text = "Statistically significant after RAS adjustment"
+        sig_color = "#00CC96"
+    else:
+        sig_text = "Not significant after RAS adjustment (IC ≤ 0)"
+        sig_color = "#EF553B"
+    annotations.append(
+        {
+            "x": 0.5,
+            "y": -0.22,
+            "text": sig_text,
+            "showarrow": False,
+            "font": {"size": 13, "color": sig_color, "weight": "bold"},
+            "xref": "paper",
+            "yref": "paper",
+        }
+    )
+    # N and T if provided
+    if n_features is not None and n_observations is not None:
+        annotations.append(
+            {
+                "x": 0.5,
+                "y": 1.08,
+                "text": f"N={n_features} features, T={n_observations} observations",
+                "showarrow": False,
+                "font": {"size": 11, "color": "gray"},
+                "xref": "paper",
+                "yref": "paper",
+            }
+        )
+    # Build layout
+    layout_updates = {
+        "title": {"text": title, "font": {"size": 18}},
+        "height": height,
+        "width": width,
+        "yaxis": {"title": "Information Coefficient"},
+        "showlegend": False,
+        "annotations": annotations,
+        "margin": {"l": 60, "r": 40, "t": 80, "b": 100},
+    }
+    for key, value in theme_config["layout"].items():
+        if key not in layout_updates:
+            layout_updates[key] = value
+    fig.update_layout(**layout_updates)
+    return fig
+def plot_minimum_track_record(
+    observed_sharpe: float,
+    current_periods: int,
+    sr_benchmark: float = 0.0,
+    confidence: float = 0.95,
+    max_periods: int | None = None,
+    periods_per_year: int = 252,
+    title: str = "Minimum Track Record Length",
+    theme: str | None = None,
+    height: int = 400,
+    width: int | None = None,
+) -> go.Figure:
+    """Visualize minimum track record length (MinTRL) analysis.
+    Shows how many periods are needed to achieve statistical significance
+    for the observed Sharpe ratio, and whether the current track record
+    is sufficient.
+    Parameters
+    ----------
+    observed_sharpe : float
+        The observed Sharpe ratio (annualized)
+    current_periods : int
+        Current number of observation periods
+    sr_benchmark : float
+        Benchmark Sharpe ratio for comparison (default: 0)
+    confidence : float
+        Target confidence level (default: 0.95)
+    max_periods : int, optional
+        Maximum periods to show on x-axis
+    periods_per_year : int
+        Periods per year for time conversion (default: 252 for daily)
+    title : str
+        Chart title
+    theme : str, optional
+        Theme name
+    height : int
+        Figure height in pixels
+    width : int, optional
+        Figure width in pixels
+    Returns
+    -------
+    go.Figure
+        Plotly figure with MinTRL analysis
+    Notes
+    -----
+    The minimum track record length formula is:
+    MinTRL = 1 + (1 - γ₃*SR + γ₄*SR²/4) * (z_α / SR)²
+    where γ₃ is skewness, γ₄ is excess kurtosis, and z_α is the
+    critical value for confidence level α.
+    """
+    from scipy import stats
+    theme_config = get_theme_config(theme)
+    colors = theme_config["colorway"]
+    # Calculate MinTRL (simplified, assuming normal returns)
+    z_alpha = stats.norm.ppf(confidence)
+    sharpe_diff = observed_sharpe - sr_benchmark
+    if sharpe_diff <= 0:
+        min_trl = float("inf")
+    else:
+        # Simplified MinTRL (assuming γ₃=0, γ₄=3)
+        min_trl = (z_alpha / sharpe_diff) ** 2
+    # Convert to years
+    min_trl_years = min_trl / periods_per_year if min_trl != float("inf") else float("inf")
+    current_years = current_periods / periods_per_year
+    # Determine max periods for x-axis
+    if max_periods is None:
+        if min_trl != float("inf"):
+            max_periods = int(max(min_trl * 1.5, current_periods * 1.2))
+        else:
+            max_periods = current_periods * 2
+    # Generate data for the required SR curve at different track record lengths
+    periods_range = np.linspace(10, max_periods, 100)
+    # Required SR to achieve significance at each track record length
+    # SR_required = z_alpha / sqrt(T)
+    required_sr = z_alpha / np.sqrt(periods_range) + sr_benchmark
+    fig = go.Figure()
+    # Required SR curve
+    fig.add_trace(
+        go.Scatter(
+            x=periods_range / periods_per_year,
+            y=required_sr,
+            mode="lines",
+            name=f"{int(confidence * 100)}% Significance Threshold",
+            line={"color": colors[1] if len(colors) > 1 else "orange", "width": 2, "dash": "dash"},
+            fill="tozeroy",
+            fillcolor="rgba(239, 85, 59, 0.2)",
+            hovertemplate="Track Record: %{x:.1f} years<br>Required SR: %{y:.2f}<extra></extra>",
+        )
+    )
+    # Horizontal line at observed Sharpe
+    fig.add_trace(
+        go.Scatter(
+            x=[0, max_periods / periods_per_year],
+            y=[observed_sharpe, observed_sharpe],
+            mode="lines",
+            name=f"Observed SR: {observed_sharpe:.2f}",
+            line={"color": colors[0], "width": 3},
+            hovertemplate="Observed Sharpe: %{y:.2f}<extra></extra>",
+        )
+    )
+    # Current position marker
+    is_significant = current_periods >= min_trl
+    marker_color = "#00CC96" if is_significant else "#EF553B"
+    fig.add_trace(
+        go.Scatter(
+            x=[current_years],
+            y=[observed_sharpe],
+            mode="markers",
+            name="Current Position",
+            marker={"color": marker_color, "size": 15, "symbol": "star"},
+            hovertemplate=f"Current: {current_years:.1f} years<br>SR: {observed_sharpe:.2f}<extra></extra>",
+        )
+    )
+    # Add vertical line at MinTRL
+    if min_trl != float("inf") and min_trl <= max_periods:
+        fig.add_vline(
+            x=min_trl_years,
+            line_dash="dot",
+            line_color="gray",
+            annotation_text=f"MinTRL: {min_trl_years:.1f}y",
+            annotation_position="top",
+        )
+    # Add significance zone annotation
+    annotations = []
+    if is_significant:
+        status_text = (
+            f"Track record sufficient ({current_years:.1f}y ≥ MinTRL {min_trl_years:.1f}y)"
+        )
+        status_color = "#00CC96"
+    elif min_trl == float("inf"):
+        status_text = "Cannot achieve significance (SR ≤ benchmark)"
+        status_color = "#EF553B"
+    else:
+        deficit = min_trl_years - current_years
+        status_text = f"Need {deficit:.1f} more years (MinTRL: {min_trl_years:.1f}y)"
+        status_color = "#FFA15A"
+    annotations.append(
+        {
+            "x": 0.5,
+            "y": -0.15,
+            "text": status_text,
+            "showarrow": False,
+            "font": {"size": 13, "color": status_color, "weight": "bold"},
+            "xref": "paper",
+            "yref": "paper",
+        }
+    )
+    # Build layout
+    layout_updates = {
+        "title": {"text": title, "font": {"size": 18}},
+        "height": height,
+        "xaxis": {"title": "Track Record Length (Years)", "rangemode": "tozero"},
+        "yaxis": {"title": "Sharpe Ratio", "rangemode": "tozero"},
+        "legend": {"yanchor": "top", "y": 0.99, "xanchor": "right", "x": 0.99},
+        "annotations": annotations,
+        "margin": {"b": 80},
+    }
+    if width:
+        layout_updates["width"] = width
+    for key, value in theme_config["layout"].items():
+        if key not in layout_updates:
+            layout_updates[key] = value
+    fig.update_layout(**layout_updates)
+    return fig
+def plot_statistical_summary_card(
+    metrics: dict[str, Any],
+    title: str = "Statistical Validity Summary",
+    theme: str | None = None,
+    height: int = 300,
+    width: int = 700,
+) -> go.Figure:
+    """Create an executive summary card for statistical validity checks.
+    Combines multiple statistical tests into a single traffic-light display
+    showing overall strategy validity.
+    Parameters
+    ----------
+    metrics : dict[str, Any]
+        Dictionary with statistical metrics. Expected keys:
+        - dsr_probability: DSR p-value
+        - dsr_significant: bool
+        - min_trl: minimum track record length
+        - current_trl: current track record length
+        - trl_sufficient: bool
+        - ras_adjusted_ic: RAS-adjusted IC (optional)
+        - ras_significant: bool (optional)
+    title : str
+        Chart title
+    theme : str, optional
+        Theme name
+    height : int
+        Figure height in pixels
+    width : int
+        Figure width in pixels
+    Returns
+    -------
+    go.Figure
+        Plotly figure with summary card
+    """
+    theme_config = get_theme_config(theme)
+    # Extract metrics with defaults
+    dsr_prob = metrics.get("dsr_probability", None)
+    dsr_sig = metrics.get("dsr_significant", None)
+    min_trl = metrics.get("min_trl", None)
+    current_trl = metrics.get("current_trl", None)
+    trl_sufficient = metrics.get("trl_sufficient", None)
+    ras_ic = metrics.get("ras_adjusted_ic", None)
+    ras_sig = metrics.get("ras_significant", None)
+    # Build indicators
+    indicators = []
+    # DSR check
+    if dsr_prob is not None:
+        if dsr_sig:
+            indicators.append(("DSR", f"p={dsr_prob:.3f}", "green", "Significant"))
+        elif dsr_prob < 0.10:
+            indicators.append(("DSR", f"p={dsr_prob:.3f}", "yellow", "Marginal"))
+        else:
+            indicators.append(("DSR", f"p={dsr_prob:.3f}", "red", "Not Significant"))
+    # MinTRL check
+    if min_trl is not None and current_trl is not None:
+        if trl_sufficient:
+            indicators.append(
+                ("Track Record", f"{current_trl:.0f}/{min_trl:.0f}", "green", "Sufficient")
+            )
+        else:
+            indicators.append(
+                ("Track Record", f"{current_trl:.0f}/{min_trl:.0f}", "red", "Insufficient")
+            )
+    # RAS check
+    if ras_ic is not None:
+        if ras_sig:
+            indicators.append(("RAS IC", f"{ras_ic:.4f}", "green", "Significant"))
+        else:
+            indicators.append(("RAS IC", f"{ras_ic:.4f}", "red", "Not Significant"))
+    if not indicators:
+        indicators = [("No Data", "-", "gray", "No statistical tests available")]
+    # Create table-like figure
+    n_cols = len(indicators)
+    # Color mapping
+    color_map = {
+        "green": "#00CC96",
+        "yellow": "#FECB52",
+        "red": "#EF553B",
+        "gray": "#888888",
+    }
+    fig = go.Figure()
+    for i, (name, value, color, status) in enumerate(indicators):
+        x_pos = (i + 0.5) / n_cols
+        # Status icon (colored circle)
+        fig.add_annotation(
+            x=x_pos,
+            y=0.75,
+            text="●",
+            showarrow=False,
+            font={"size": 40, "color": color_map[color]},
+            xref="paper",
+            yref="paper",
+        )
+        # Metric name
+        fig.add_annotation(
+            x=x_pos,
+            y=0.5,
+            text=f"<b>{name}</b>",
+            showarrow=False,
+            font={"size": 14},
+            xref="paper",
+            yref="paper",
+        )
+        # Value
+        fig.add_annotation(
+            x=x_pos,
+            y=0.35,
+            text=value,
+            showarrow=False,
+            font={"size": 12},
+            xref="paper",
+            yref="paper",
+        )
+        # Status text
+        fig.add_annotation(
+            x=x_pos,
+            y=0.2,
+            text=status,
+            showarrow=False,
+            font={"size": 11, "color": color_map[color]},
+            xref="paper",
+            yref="paper",
+        )
+    # Build layout
+    layout_updates = {
+        "title": {"text": title, "font": {"size": 18}, "x": 0.5},
+        "height": height,
+        "width": width,
+        "xaxis": {"visible": False, "range": [0, 1]},
+        "yaxis": {"visible": False, "range": [0, 1]},
+        "margin": {"l": 20, "r": 20, "t": 60, "b": 20},
+    }
+    for key, value in theme_config["layout"].items():
+        if key not in layout_updates:
+            layout_updates[key] = value
+    fig.update_layout(**layout_updates)
+    return fig