PyPI - MIDRC-MELODY - Versions diffs - 0.3.3__py3-none-any.whl - Mend

MIDRC-MELODY 0.3.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (37) hide show

MIDRC_MELODY/__init__.py +0 -0
MIDRC_MELODY/__main__.py +4 -0
MIDRC_MELODY/common/__init__.py +0 -0
MIDRC_MELODY/common/data_loading.py +199 -0
MIDRC_MELODY/common/data_preprocessing.py +134 -0
MIDRC_MELODY/common/edit_config.py +156 -0
MIDRC_MELODY/common/eod_aaod_metrics.py +292 -0
MIDRC_MELODY/common/generate_eod_aaod_spiders.py +69 -0
MIDRC_MELODY/common/generate_qwk_spiders.py +56 -0
MIDRC_MELODY/common/matplotlib_spider.py +425 -0
MIDRC_MELODY/common/plot_tools.py +132 -0
MIDRC_MELODY/common/plotly_spider.py +217 -0
MIDRC_MELODY/common/qwk_metrics.py +244 -0
MIDRC_MELODY/common/table_tools.py +230 -0
MIDRC_MELODY/gui/__init__.py +0 -0
MIDRC_MELODY/gui/config_editor.py +200 -0
MIDRC_MELODY/gui/data_loading.py +157 -0
MIDRC_MELODY/gui/main_controller.py +154 -0
MIDRC_MELODY/gui/main_window.py +545 -0
MIDRC_MELODY/gui/matplotlib_spider_widget.py +204 -0
MIDRC_MELODY/gui/metrics_model.py +62 -0
MIDRC_MELODY/gui/plotly_spider_widget.py +56 -0
MIDRC_MELODY/gui/qchart_spider_widget.py +272 -0
MIDRC_MELODY/gui/shared/__init__.py +0 -0
MIDRC_MELODY/gui/shared/react/__init__.py +0 -0
MIDRC_MELODY/gui/shared/react/copyabletableview.py +100 -0
MIDRC_MELODY/gui/shared/react/grabbablewidget.py +406 -0
MIDRC_MELODY/gui/tqdm_handler.py +210 -0
MIDRC_MELODY/melody.py +102 -0
MIDRC_MELODY/melody_gui.py +111 -0
MIDRC_MELODY/resources/MIDRC.ico +0 -0
midrc_melody-0.3.3.dist-info/METADATA +151 -0
midrc_melody-0.3.3.dist-info/RECORD +37 -0
midrc_melody-0.3.3.dist-info/WHEEL +5 -0
midrc_melody-0.3.3.dist-info/entry_points.txt +4 -0
midrc_melody-0.3.3.dist-info/licenses/LICENSE +201 -0
midrc_melody-0.3.3.dist-info/top_level.txt +1 -0

MIDRC_MELODY/common/eod_aaod_metrics.py ADDED Viewed

@@ -0,0 +1,292 @@
+#  Copyright (c) 2025 Medical Imaging and Data Resource Center (MIDRC).
+#
+#      Licensed under the Apache License, Version 2.0 (the "License");
+#      you may not use this file except in compliance with the License.
+#      You may obtain a copy of the License at
+#
+#         http://www.apache.org/licenses/LICENSE-2.0
+#
+#      Unless required by applicable law or agreed to in writing, software
+#      distributed under the License is distributed on an "AS IS" BASIS,
+#      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+#      See the License for the specific language governing permissions and
+#      limitations under the License.
+#
+""" EOD and AAOD metric calculation and plotting functions. """
+from typing import Any, Dict, List, Optional, Tuple, Union
+from joblib import delayed, Parallel
+import matplotlib.pyplot as plt
+import numpy as np
+import pandas as pd
+from sklearn.utils import resample
+from tqdm import tqdm
+from tqdm_joblib import tqdm_joblib
+from MIDRC_MELODY.common.data_loading import check_required_columns, TestAndDemographicData
+from MIDRC_MELODY.common.plot_tools import SpiderPlotData
+from MIDRC_MELODY.common.matplotlib_spider import plot_spider_chart, display_figures_grid
+def binarize_scores(df: pd.DataFrame, truth_col: str, ai_cols: Union[List[str], str], threshold: int = 4
+                    ) -> pd.DataFrame:
+    """
+    Binarize scores based on a threshold for truth and AI columns.
+    Converts values greater than or equal to threshold to 1, else 0.
+    :arg df: DataFrame containing truth and test columns.
+    :arg truth_col: Name of the truth column.
+    :arg ai_cols: Name of the test column or a list of test columns.
+    :arg threshold: Threshold value for binarization.
+    :returns: DataFrame with binarized columns.
+    """
+    if not isinstance(ai_cols, list):
+        ai_cols = [ai_cols]
+    cols = [truth_col] + ai_cols
+    check_required_columns(df, cols)
+    df[cols] = (df[cols] >= threshold).astype(int)
+    return df
+def resample_by_column(df: pd.DataFrame, col: Union[str, List[str]], seed: int) -> pd.DataFrame:
+    """
+    Resample each group in a DataFrame by the specified column
+    using the same seed across groups.
+    :arg df: DataFrame to resample.
+    :arg col: Column to group by.
+    :arg seed: Seed for reproducibility across groups.
+    :returns: Resampled DataFrame.
+    """
+    sampled_groups = [
+        resample(group_df, replace=True, n_samples=len(group_df), random_state=seed)
+        for _, group_df in df.groupby(col)
+    ]
+    return pd.concat(sampled_groups)
+def compute_bootstrap_eod_aaod(
+    df: pd.DataFrame,
+    category: str,
+    ref_group: Any,
+    group_value: Any,
+    truth_col: str,
+    ai_columns: List[str],
+    seed: int
+) -> Dict[str, Tuple[float, float]]:
+    """
+    Compute bootstrap estimates for EOD and AAOD metrics.
+    :arg df: DataFrame containing truth and test columns.
+    :arg category: Column to group by.
+    :arg ref_group: Reference group value.
+    :arg group_value: Group value to compare against reference.
+    :arg truth_col: Name of the truth column.
+    :arg ai_columns: List of test columns.
+    :arg seed: Seed for reproducibility.
+    :returns: Dictionary of EOD and AAOD values for each model.
+    """
+    sample_df = resample_by_column(df, [category, truth_col], seed)
+    ref_df = sample_df[sample_df[category] == ref_group]
+    group_df = sample_df[sample_df[category] == group_value]
+    # Precompute truth masks for both reference and group DataFrames
+    ref_truth_pos = (ref_df[truth_col] == 1)
+    ref_truth_neg = ~ref_truth_pos
+    group_truth_pos = (group_df[truth_col] == 1)
+    group_truth_neg = ~group_truth_pos
+    results: Dict[str, Tuple[float, float]] = {}
+    for model in ai_columns:
+        ref_pred = (ref_df[model] == 1)
+        group_pred = (group_df[model] == 1)
+        tpr_ref = ref_pred[ref_truth_pos].sum() / ref_truth_pos.sum() if ref_truth_pos.sum() else np.nan
+        fpr_ref = ref_pred[ref_truth_neg].sum() / ref_truth_neg.sum() if ref_truth_neg.sum() else np.nan
+        tpr_group = group_pred[group_truth_pos].sum() / group_truth_pos.sum() if group_truth_pos.sum() else np.nan
+        fpr_group = group_pred[group_truth_neg].sum() / group_truth_neg.sum() if group_truth_neg.sum() else np.nan
+        eod = tpr_group - tpr_ref
+        aaod = 0.5 * (abs(fpr_group - fpr_ref) + abs(tpr_group - tpr_ref))
+        results[model] = (eod, aaod)
+    return results
+def calculate_eod_aaod(
+    test_data: TestAndDemographicData
+) -> Dict[str, Dict[str, Dict[Any, Dict[str, Any]]]]:
+    """
+    Calculate EOD and AAOD metrics with bootstrap iterations for multiple categories.
+    :arg test_data: Test and demographic data.
+    :returns: Dictionary of EOD and AAOD values for each model.
+    """
+    ai_columns = test_data.test_cols
+    eod_aaod: Dict[str, Dict[str, Dict[Any, Dict[str, Any]]]] = {
+        category: {model: {} for model in ai_columns} for category in test_data.categories
+    }
+    rng = np.random.default_rng(test_data.base_seed)
+    for category in tqdm(test_data.categories, desc='Categories', position=0):
+        if category not in test_data.valid_groups:
+            continue
+        ref_group = test_data.reference_groups[category]
+        unique_values = test_data.matched_df[category].unique()
+        for group_value in tqdm(unique_values, desc=f"Category \'{category}\' Groups", leave=False, position=1):
+            if group_value == ref_group or group_value not in test_data.valid_groups[category]:
+                continue
+            eod_samples = {model: [] for model in ai_columns}
+            aaod_samples = {model: [] for model in ai_columns}
+            # Preassign seeds for each bootstrap iteration.
+            seeds = rng.integers(0, 1_000_000, size=test_data.n_iter)
+            with tqdm_joblib(total=test_data.n_iter, desc=f"Bootstrapping \'{group_value}\' Group", leave=False):
+                bootstrap_results = Parallel(n_jobs=-1)(
+                    delayed(compute_bootstrap_eod_aaod)(
+                        test_data.matched_df, category, ref_group, group_value, test_data.truth_col, ai_columns, seed
+                    ) for seed in seeds
+                )
+            for result in bootstrap_results:
+                for model in ai_columns:
+                    eod_samples[model].append(result[model][0])
+                    aaod_samples[model].append(result[model][1])
+            for model in ai_columns:
+                eod_median = np.median(eod_samples[model])
+                aaod_median = np.median(aaod_samples[model])
+                eod_ci = np.percentile(eod_samples[model], [2.5, 97.5])
+                aaod_ci = np.percentile(aaod_samples[model], [2.5, 97.5])
+                eod_aaod[category][model][group_value] = {
+                    'eod': (eod_median, eod_ci),
+                    'aaod': (aaod_median, aaod_ci)
+                }
+    return eod_aaod
+def extract_plot_data_eod_aaod(
+    eod_aaod: Dict[str, Dict[str, Dict[Any, Dict[str, Any]]]],
+    model: str,
+    metric: str = 'eod'
+) -> Tuple[List[str], List[float], List[float], List[float]]:
+    """
+    Extract groups, metric values and confidence intervals for plotting.
+    :arg eod_aaod: Dictionary of EOD and AAOD values for each model.
+    :arg model: Name of the model to extract data for.
+    :arg metric: Metric to extract data for (EOD or AAOD).
+    :returns: Tuple of groups, values, lower bounds and upper bounds.
+    """
+    groups: List[str] = []
+    values: List[float] = []
+    lower_bounds: List[float] = []
+    upper_bounds: List[float] = []
+    for category, model_data in eod_aaod.items():
+        if model in model_data:
+            for group, metric_list in model_data[model].items():
+                groups.append(f"{category}: {group}")
+                value, (lower, upper) = metric_list[metric]
+                values.append(value)
+                lower_bounds.append(lower)
+                upper_bounds.append(upper)
+    return groups, values, lower_bounds, upper_bounds
+def generate_plot_data_eod_aaod(
+    eod_aaod: Dict[str, Dict[str, Dict[Any, Dict[str, Any]]]],
+    test_cols: List[str],
+    metrics: List[str] = ('eod', 'aaod')
+) -> Tuple[Dict[str, Dict[str, Tuple[List[str], List[float], List[float], List[float]]]],
+           Dict[str, float], Dict[str, float]]:
+    """
+    Generate plot data for each metric and compute global axis limits.
+    :arg eod_aaod: Dictionary of EOD and AAOD values for each model.
+    :arg test_cols: List of test columns.
+    :arg metrics: List of metrics to plot.
+    :returns: Tuple of plot data dictionary, global minimum and maximum values.
+    """
+    plot_data_dict: Dict[str, Dict[str, Tuple[List[str], List[float], List[float], List[float]]]] = {}
+    global_min = {}
+    global_max = {}
+    for metric in metrics:
+        all_values: List[float] = []
+        plot_data_dict[metric] = {}
+        for model in test_cols:
+            groups, values, lower, upper = extract_plot_data_eod_aaod(eod_aaod, model, metric)
+            plot_data_dict[metric][model] = (groups, values, lower, upper)
+            all_values.extend(lower + upper)
+        global_min[metric], global_max[metric] = min(all_values) - 0.05, max(all_values) + 0.05
+    return plot_data_dict, global_min, global_max
+def create_spider_plot_data_eod_aaod(
+    plot_data_dict: Dict[str, Dict[str, Tuple[List[str], List[float], List[float], List[float]]]],
+    test_cols: List[str],
+    metrics: List[str] = ('eod', 'aaod'),
+    base_plot_data: Optional[SpiderPlotData] = None,
+) -> List[SpiderPlotData]:
+    plot_data_list: List[SpiderPlotData] = []
+    if base_plot_data is None:
+        base_plot_data = SpiderPlotData()
+    for metric in metrics:
+        for model in test_cols:
+            # Create a new copy based on the base instance
+            plot_data = SpiderPlotData(**base_plot_data.__dict__)
+            plot_data.metric = metric
+            plot_data.model_name = model
+            plot_data.groups, plot_data.values, plot_data.lower_bounds, plot_data.upper_bounds = \
+                plot_data_dict[metric][model]
+            plot_data_list.append(plot_data)
+    return plot_data_list
+def plot_data_eod_aaod(
+    plot_data_dict: Dict[str, Dict[str, Tuple[List[str], List[float], List[float], List[float]]]],
+    test_cols: List[str],
+    metrics: List[str] = ('eod', 'aaod'),
+    base_plot_data: Optional[SpiderPlotData] = None,
+) -> Dict[str, List[plt.Figure]]:
+    """
+    Plot EOD and AAOD spider charts for each model.
+    :arg plot_data_dict: Dictionary of plot data for each metric.
+    :arg test_cols: List of test columns.
+    :arg metrics: List of metrics to plot.
+    :arg base_plot_data: Base SpiderPlotData instance for plot configuration.
+    :returns: Dictionary of generated figures for each metric.
+    """
+    plot_data_list = create_spider_plot_data_eod_aaod(plot_data_dict, test_cols, metrics, base_plot_data)
+    figures_dict: Dict[str, List[Any]] = {metric: [] for metric in metrics}
+    for plot_data in plot_data_list:
+        fig = plot_spider_chart(plot_data)
+        figures_dict[plot_data.metric].append(fig)
+    grid_figs = []
+    for figures in figures_dict.values():
+        grid_fig = display_figures_grid(figures)
+        grid_figs.append(grid_fig)
+    # all_figs = [fig for figs in figures_dict.values() for fig in figs] + [g for g in grid_figs if g is not None]
+    return figures_dict

MIDRC_MELODY/common/generate_eod_aaod_spiders.py ADDED Viewed

@@ -0,0 +1,69 @@
+#  Copyright (c) 2025 Medical Imaging and Data Resource Center (MIDRC).
+#
+#      Licensed under the Apache License, Version 2.0 (the "License");
+#      you may not use this file except in compliance with the License.
+#      You may obtain a copy of the License at
+#
+#         http://www.apache.org/licenses/LICENSE-2.0
+#
+#      Unless required by applicable law or agreed to in writing, software
+#      distributed under the License is distributed on an "AS IS" BASIS,
+#      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+#      See the License for the specific language governing permissions and
+#      limitations under the License.
+#
+"""This script generates EOD and AAOD spider plots for multiple models across different categories."""
+from dataclasses import replace
+import matplotlib.pyplot as plt
+from pylab import get_current_fig_manager
+import yaml
+from MIDRC_MELODY.common.data_loading import build_test_and_demographic_data, save_pickled_data
+from MIDRC_MELODY.common.eod_aaod_metrics import (binarize_scores, calculate_eod_aaod, generate_plot_data_eod_aaod,
+                                                  plot_data_eod_aaod)
+from MIDRC_MELODY.common.plot_tools import SpiderPlotData
+from MIDRC_MELODY.common.table_tools import print_table_of_nonzero_eod_aaod
+def generate_eod_aaod_spiders(cfg_path: str = "config.yaml"):
+    # Load configuration
+    with open(cfg_path, 'r', encoding='utf-8') as stream:
+        config = yaml.load(stream, Loader=yaml.CLoader)
+    # Load data
+    t_data = build_test_and_demographic_data(config)
+    # Binarize scores
+    threshold = config['binary threshold']
+    matched_df = binarize_scores(t_data.matched_df, t_data.truth_col, t_data.test_cols, threshold=threshold)
+    test_data = replace(t_data, matched_df=matched_df)
+    # Calculate EOD and AAOD
+    eod_aaod = calculate_eod_aaod(test_data)
+    # Print tables for EOD and AAOD using median values
+    print_table_of_nonzero_eod_aaod(eod_aaod, tablefmt="rounded_outline")
+    # Generate and save plots
+    metrics = ['eod', 'aaod']
+    plot_data_dict, global_min, global_max = generate_plot_data_eod_aaod(eod_aaod, test_data.test_cols, metrics=metrics)
+    # Save the EOD and AAOD data
+    for metric in metrics:
+        save_pickled_data(config['output'], metric, plot_data_dict[metric])
+    base_plot_data = SpiderPlotData(ylim_min=global_min, ylim_max=global_max, plot_config=config['plot'])
+    figures_dict = plot_data_eod_aaod(plot_data_dict,                    # noqa: F841
+                                      test_data.test_cols,
+                                      metrics=metrics,
+                                      base_plot_data=base_plot_data,
+                                      )
+    print("\nClose all figures to continue...", flush=True)
+    plt.show()
+if __name__ == '__main__':
+    generate_eod_aaod_spiders()

MIDRC_MELODY/common/generate_qwk_spiders.py ADDED Viewed

@@ -0,0 +1,56 @@
+#  Copyright (c) 2025 Medical Imaging and Data Resource Center (MIDRC).
+#
+#      Licensed under the Apache License, Version 2.0 (the "License");
+#      you may not use this file except in compliance with the License.
+#      You may obtain a copy of the License at
+#
+#         http://www.apache.org/licenses/LICENSE-2.0
+#
+#      Unless required by applicable law or agreed to in writing, software
+#      distributed under the License is distributed on an "AS IS" BASIS,
+#      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+#      See the License for the specific language governing permissions and
+#      limitations under the License.
+#
+"""This script generates QWK spider plots for multiple models across different categories."""
+import matplotlib.pyplot as plt
+import yaml
+from MIDRC_MELODY.common.data_loading import build_test_and_demographic_data, save_pickled_data
+from MIDRC_MELODY.common.qwk_metrics import (calculate_delta_kappa, calculate_kappas_and_intervals,
+                                             generate_plots_from_delta_kappas)
+from MIDRC_MELODY.common.table_tools import print_table_of_nonzero_deltas
+def generate_qwk_spiders(cfg_path: str = "config.yaml"):
+    # Load configuration
+    with open(cfg_path, 'r', encoding='utf-8') as stream:
+        config = yaml.load(stream, Loader=yaml.CLoader)
+    # Load data
+    test_data = build_test_and_demographic_data(config)
+    # Calculate Kappas and intervals, prints the table of Kappas and intervals
+    kappas, intervals = calculate_kappas_and_intervals(test_data)
+    # Bootstrap delta QWKs
+    print("Bootstrapping ∆κ, this may take a while", flush=True)
+    delta_kappas = calculate_delta_kappa(test_data)
+    # Print the table of non-zero delta Kappas
+    print_table_of_nonzero_deltas(delta_kappas, tablefmt="rounded_outline")
+    # Save the delta Kappas
+    save_pickled_data(config['output'], "QWK", delta_kappas)
+    # Generate and save plots
+    generate_plots_from_delta_kappas(delta_kappas, test_data.test_cols, plot_config=config['plot'])
+    print("\nClose all figures to continue...", flush=True)
+    plt.show()
+if __name__ == '__main__':
+    generate_qwk_spiders()