birdnet-analyzer 2.0.1__py3-none-any.whl → 2.1.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (121) hide show
  1. birdnet_analyzer/__init__.py +9 -9
  2. birdnet_analyzer/analyze/__init__.py +19 -5
  3. birdnet_analyzer/analyze/__main__.py +3 -3
  4. birdnet_analyzer/analyze/cli.py +30 -25
  5. birdnet_analyzer/analyze/core.py +268 -241
  6. birdnet_analyzer/analyze/utils.py +700 -692
  7. birdnet_analyzer/audio.py +368 -368
  8. birdnet_analyzer/cli.py +732 -709
  9. birdnet_analyzer/config.py +243 -242
  10. birdnet_analyzer/eBird_taxonomy_codes_2024E.json +13046 -0
  11. birdnet_analyzer/embeddings/__init__.py +3 -3
  12. birdnet_analyzer/embeddings/__main__.py +3 -3
  13. birdnet_analyzer/embeddings/cli.py +12 -12
  14. birdnet_analyzer/embeddings/core.py +70 -69
  15. birdnet_analyzer/embeddings/utils.py +173 -179
  16. birdnet_analyzer/evaluation/__init__.py +189 -196
  17. birdnet_analyzer/evaluation/__main__.py +3 -3
  18. birdnet_analyzer/evaluation/assessment/metrics.py +388 -388
  19. birdnet_analyzer/evaluation/assessment/performance_assessor.py +364 -409
  20. birdnet_analyzer/evaluation/assessment/plotting.py +378 -379
  21. birdnet_analyzer/evaluation/preprocessing/data_processor.py +631 -631
  22. birdnet_analyzer/evaluation/preprocessing/utils.py +98 -98
  23. birdnet_analyzer/gui/__init__.py +19 -19
  24. birdnet_analyzer/gui/__main__.py +3 -3
  25. birdnet_analyzer/gui/analysis.py +179 -175
  26. birdnet_analyzer/gui/assets/arrow_down.svg +4 -4
  27. birdnet_analyzer/gui/assets/arrow_left.svg +4 -4
  28. birdnet_analyzer/gui/assets/arrow_right.svg +4 -4
  29. birdnet_analyzer/gui/assets/arrow_up.svg +4 -4
  30. birdnet_analyzer/gui/assets/gui.css +36 -28
  31. birdnet_analyzer/gui/assets/gui.js +89 -93
  32. birdnet_analyzer/gui/embeddings.py +638 -619
  33. birdnet_analyzer/gui/evaluation.py +801 -795
  34. birdnet_analyzer/gui/localization.py +75 -75
  35. birdnet_analyzer/gui/multi_file.py +265 -245
  36. birdnet_analyzer/gui/review.py +472 -519
  37. birdnet_analyzer/gui/segments.py +191 -191
  38. birdnet_analyzer/gui/settings.py +149 -128
  39. birdnet_analyzer/gui/single_file.py +264 -267
  40. birdnet_analyzer/gui/species.py +95 -95
  41. birdnet_analyzer/gui/train.py +687 -696
  42. birdnet_analyzer/gui/utils.py +803 -810
  43. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_af.txt +6522 -6522
  44. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_ar.txt +6522 -6522
  45. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_bg.txt +6522 -6522
  46. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_ca.txt +6522 -6522
  47. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_cs.txt +6522 -6522
  48. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_da.txt +6522 -6522
  49. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_de.txt +6522 -6522
  50. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_el.txt +6522 -6522
  51. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_en_uk.txt +6522 -6522
  52. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_es.txt +6522 -6522
  53. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_fi.txt +6522 -6522
  54. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_fr.txt +6522 -6522
  55. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_he.txt +6522 -6522
  56. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_hr.txt +6522 -6522
  57. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_hu.txt +6522 -6522
  58. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_in.txt +6522 -6522
  59. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_is.txt +6522 -6522
  60. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_it.txt +6522 -6522
  61. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_ja.txt +6522 -6522
  62. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_ko.txt +6522 -6522
  63. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_lt.txt +6522 -6522
  64. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_ml.txt +6522 -6522
  65. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_nl.txt +6522 -6522
  66. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_no.txt +6522 -6522
  67. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_pl.txt +6522 -6522
  68. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_pt_BR.txt +6522 -6522
  69. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_pt_PT.txt +6522 -6522
  70. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_ro.txt +6522 -6522
  71. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_ru.txt +6522 -6522
  72. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_sk.txt +6522 -6522
  73. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_sl.txt +6522 -6522
  74. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_sr.txt +6522 -6522
  75. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_sv.txt +6522 -6522
  76. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_th.txt +6522 -6522
  77. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_tr.txt +6522 -6522
  78. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_uk.txt +6522 -6522
  79. birdnet_analyzer/labels/V2.4/BirdNET_GLOBAL_6K_V2.4_Labels_zh.txt +6522 -6522
  80. birdnet_analyzer/lang/de.json +342 -334
  81. birdnet_analyzer/lang/en.json +342 -334
  82. birdnet_analyzer/lang/fi.json +342 -334
  83. birdnet_analyzer/lang/fr.json +342 -334
  84. birdnet_analyzer/lang/id.json +342 -334
  85. birdnet_analyzer/lang/pt-br.json +342 -334
  86. birdnet_analyzer/lang/ru.json +342 -334
  87. birdnet_analyzer/lang/se.json +342 -334
  88. birdnet_analyzer/lang/tlh.json +342 -334
  89. birdnet_analyzer/lang/zh_TW.json +342 -334
  90. birdnet_analyzer/model.py +1213 -1212
  91. birdnet_analyzer/search/__init__.py +3 -3
  92. birdnet_analyzer/search/__main__.py +3 -3
  93. birdnet_analyzer/search/cli.py +11 -11
  94. birdnet_analyzer/search/core.py +78 -78
  95. birdnet_analyzer/search/utils.py +104 -107
  96. birdnet_analyzer/segments/__init__.py +3 -3
  97. birdnet_analyzer/segments/__main__.py +3 -3
  98. birdnet_analyzer/segments/cli.py +13 -13
  99. birdnet_analyzer/segments/core.py +81 -81
  100. birdnet_analyzer/segments/utils.py +383 -383
  101. birdnet_analyzer/species/__init__.py +3 -3
  102. birdnet_analyzer/species/__main__.py +3 -3
  103. birdnet_analyzer/species/cli.py +13 -13
  104. birdnet_analyzer/species/core.py +35 -35
  105. birdnet_analyzer/species/utils.py +73 -74
  106. birdnet_analyzer/train/__init__.py +3 -3
  107. birdnet_analyzer/train/__main__.py +3 -3
  108. birdnet_analyzer/train/cli.py +13 -13
  109. birdnet_analyzer/train/core.py +113 -113
  110. birdnet_analyzer/train/utils.py +878 -877
  111. birdnet_analyzer/translate.py +132 -133
  112. birdnet_analyzer/utils.py +425 -426
  113. {birdnet_analyzer-2.0.1.dist-info → birdnet_analyzer-2.1.1.dist-info}/METADATA +147 -137
  114. birdnet_analyzer-2.1.1.dist-info/RECORD +124 -0
  115. {birdnet_analyzer-2.0.1.dist-info → birdnet_analyzer-2.1.1.dist-info}/WHEEL +1 -1
  116. {birdnet_analyzer-2.0.1.dist-info → birdnet_analyzer-2.1.1.dist-info}/licenses/LICENSE +18 -18
  117. birdnet_analyzer/eBird_taxonomy_codes_2021E.json +0 -25280
  118. birdnet_analyzer/playground.py +0 -5
  119. birdnet_analyzer-2.0.1.dist-info/RECORD +0 -125
  120. {birdnet_analyzer-2.0.1.dist-info → birdnet_analyzer-2.1.1.dist-info}/entry_points.txt +0 -0
  121. {birdnet_analyzer-2.0.1.dist-info → birdnet_analyzer-2.1.1.dist-info}/top_level.txt +0 -0
@@ -1,379 +1,378 @@
1
- """
2
- Module containing functions to plot performance metrics.
3
-
4
- This script provides a variety of functions to visualize performance metrics in different formats,
5
- including bar charts, line plots, and heatmaps. These visualizations help analyze metrics such as
6
- overall performance, per-class performance, and performance across thresholds.
7
-
8
- Functions:
9
- - plot_overall_metrics: Plots a bar chart for overall performance metrics.
10
- - plot_metrics_per_class: Plots metric values per class with unique lines and colors.
11
- - plot_metrics_across_thresholds: Plots metrics across different thresholds.
12
- - plot_metrics_across_thresholds_per_class: Plots metrics across thresholds for each class.
13
- - plot_confusion_matrices: Visualizes confusion matrices for binary, multiclass, or multilabel tasks.
14
- """
15
-
16
- from typing import Literal
17
-
18
- import matplotlib.pyplot as plt
19
- import numpy as np
20
- import pandas as pd
21
- import seaborn as sns
22
-
23
-
24
- def plot_overall_metrics(metrics_df: pd.DataFrame, colors: list[str]) -> plt.Figure:
25
- """
26
- Plots a bar chart for overall performance metrics.
27
-
28
- Args:
29
- metrics_df (pd.DataFrame): DataFrame containing metric names as index and an 'Overall' column.
30
- colors (List[str]): List of colors for the bars.
31
-
32
- Raises:
33
- TypeError: If `metrics_df` is not a DataFrame or `colors` is not a list.
34
- KeyError: If 'Overall' column is missing in `metrics_df`.
35
- ValueError: If `metrics_df` is empty.
36
-
37
- Returns:
38
- plt.Figure
39
- """
40
- # Validate input types and content
41
- if not isinstance(metrics_df, pd.DataFrame):
42
- raise TypeError("metrics_df must be a pandas DataFrame.")
43
- if "Overall" not in metrics_df.columns:
44
- raise KeyError("metrics_df must contain an 'Overall' column.")
45
- if metrics_df.empty:
46
- raise ValueError("metrics_df is empty.")
47
- if not isinstance(colors, list):
48
- raise TypeError("colors must be a list.")
49
- if len(colors) == 0:
50
- # Default to matplotlib's color cycle if colors are not provided
51
- colors = plt.rcParams["axes.prop_cycle"].by_key()["color"]
52
-
53
- # Extract metric names and values
54
- metrics = metrics_df.index # Metric names
55
- values = metrics_df["Overall"].to_numpy() # Metric values
56
-
57
- # Plot bar chart
58
- fig = plt.figure(figsize=(10, 6))
59
- plt.bar(metrics, values, color=colors[: len(metrics)])
60
-
61
- # Add titles, labels, and format
62
- plt.title("Overall Metric Scores", fontsize=16)
63
- plt.xlabel("Metrics", fontsize=12)
64
- plt.ylabel("Score", fontsize=12)
65
- plt.xticks(rotation=45, ha="right", fontsize=10)
66
- plt.grid(axis="y", linestyle="--", alpha=0.7)
67
- plt.tight_layout()
68
-
69
- return fig
70
-
71
-
72
- def plot_metrics_per_class(metrics_df: pd.DataFrame, colors: list[str]) -> plt.Figure:
73
- """
74
- Plots metric values per class, with each metric represented by a distinct color and line.
75
-
76
- Args:
77
- metrics_df (pd.DataFrame): DataFrame containing metrics as index and class names as columns.
78
- colors (List[str]): List of colors for the lines.
79
-
80
- Raises:
81
- TypeError: If inputs are not of expected types.
82
- ValueError: If `metrics_df` is empty.
83
-
84
- Returns:
85
- plt.Figure
86
- """
87
- # Validate inputs
88
- if not isinstance(metrics_df, pd.DataFrame):
89
- raise TypeError("metrics_df must be a pandas DataFrame.")
90
- if metrics_df.empty:
91
- raise ValueError("metrics_df is empty.")
92
- if not isinstance(colors, list):
93
- raise TypeError("colors must be a list.")
94
- if len(colors) == 0:
95
- # Default to matplotlib's color cycle if colors are not provided
96
- colors = plt.rcParams["axes.prop_cycle"].by_key()["color"]
97
-
98
- # Line styles for distinction
99
- line_styles = ["-", "--", "-.", ":", (0, (5, 10)), (0, (5, 5)), (0, (3, 5, 1, 5))]
100
- fig = plt.figure(figsize=(10, 6))
101
-
102
- # Loop over each metric and plot it
103
- for i, metric_name in enumerate(metrics_df.index):
104
- values = metrics_df.loc[metric_name] # Metric values for each class
105
- classes = metrics_df.columns # Class labels
106
- plt.plot(
107
- classes,
108
- values,
109
- label=metric_name,
110
- marker="o",
111
- markersize=8,
112
- linewidth=2,
113
- linestyle=line_styles[i % len(line_styles)],
114
- color=colors[i % len(colors)],
115
- )
116
-
117
- # Add titles, labels, legend, and format
118
- plt.title("Metric Scores per Class", fontsize=16)
119
- plt.xlabel("Class", fontsize=12)
120
- plt.ylabel("Score", fontsize=12)
121
- plt.legend(loc="lower right")
122
- plt.grid(True)
123
- plt.tight_layout()
124
-
125
- return fig
126
-
127
-
128
- def plot_metrics_across_thresholds(
129
- thresholds: np.ndarray,
130
- metric_values_dict: dict[str, np.ndarray],
131
- metrics_to_plot: list[str],
132
- colors: list[str],
133
- ) -> plt.Figure:
134
- """
135
- Plots metrics across different thresholds.
136
-
137
- Args:
138
- thresholds (np.ndarray): Array of threshold values.
139
- metric_values_dict (Dict[str, np.ndarray]): Dictionary mapping metric names to their values.
140
- metrics_to_plot (List[str]): List of metric names to plot.
141
- colors (List[str]): List of colors for the lines.
142
-
143
- Raises:
144
- TypeError: If inputs are not of expected types.
145
- ValueError: If thresholds or metric values have mismatched lengths.
146
-
147
- Returns:
148
- plt.Figure
149
- """
150
- # Validate inputs
151
- if not isinstance(thresholds, np.ndarray):
152
- raise TypeError("thresholds must be a numpy ndarray.")
153
- if thresholds.size == 0:
154
- raise ValueError("thresholds array is empty.")
155
- if not isinstance(metric_values_dict, dict):
156
- raise TypeError("metric_values_dict must be a dictionary.")
157
- if not isinstance(metrics_to_plot, list):
158
- raise TypeError("metrics_to_plot must be a list.")
159
- if not isinstance(colors, list):
160
- raise TypeError("colors must be a list.")
161
- if len(colors) == 0:
162
- # Default to matplotlib's color cycle if colors are not provided
163
- colors = plt.rcParams["axes.prop_cycle"].by_key()["color"]
164
-
165
- # Line styles for distinction
166
- line_styles = ["-", "--", "-.", ":", (0, (5, 10)), (0, (5, 5)), (0, (3, 5, 1, 5))]
167
- fig = plt.figure(figsize=(10, 6))
168
-
169
- # Plot each metric against thresholds
170
- for i, metric_name in enumerate(metrics_to_plot):
171
- if metric_name not in metric_values_dict:
172
- raise KeyError(f"Metric '{metric_name}' not found in metric_values_dict.")
173
- metric_values = metric_values_dict[metric_name]
174
- if len(metric_values) != len(thresholds):
175
- raise ValueError(f"Length of metric '{metric_name}' values does not match length of thresholds.")
176
- plt.plot(
177
- thresholds,
178
- metric_values,
179
- label=metric_name.capitalize(),
180
- linestyle=line_styles[i % len(line_styles)],
181
- linewidth=2,
182
- color=colors[i % len(colors)],
183
- )
184
-
185
- # Add titles, labels, legend, and format
186
- plt.title("Metrics across Different Thresholds", fontsize=16)
187
- plt.xlabel("Threshold", fontsize=12)
188
- plt.ylabel("Metric Score", fontsize=12)
189
- plt.legend(loc="best")
190
- plt.grid(True)
191
- plt.tight_layout()
192
-
193
- return fig
194
-
195
-
196
- def plot_metrics_across_thresholds_per_class(
197
- thresholds: np.ndarray,
198
- metric_values_dict_per_class: dict[str, dict[str, np.ndarray]],
199
- metrics_to_plot: list[str],
200
- class_names: list[str],
201
- colors: list[str],
202
- ) -> plt.Figure:
203
- """
204
- Plots metrics across different thresholds per class.
205
-
206
- Args:
207
- thresholds (np.ndarray): Array of threshold values.
208
- metric_values_dict_per_class (Dict[str, Dict[str, np.ndarray]]): Dictionary mapping class names
209
- to metric dictionaries, each containing metric names and their values across thresholds.
210
- metrics_to_plot (List[str]): List of metric names to plot.
211
- class_names (List[str]): List of class names.
212
- colors (List[str]): List of colors for the lines.
213
-
214
- Raises:
215
- TypeError: If inputs are not of expected types.
216
- ValueError: If inputs have mismatched lengths or are empty.
217
-
218
- Returns:
219
- plt.Figure
220
- """
221
- # Validate inputs
222
- if not isinstance(thresholds, np.ndarray):
223
- raise TypeError("thresholds must be a numpy ndarray.")
224
- if thresholds.size == 0:
225
- raise ValueError("thresholds array is empty.")
226
- if not isinstance(metric_values_dict_per_class, dict):
227
- raise TypeError("metric_values_dict_per_class must be a dictionary.")
228
- if not isinstance(metrics_to_plot, list):
229
- raise TypeError("metrics_to_plot must be a list.")
230
- if not isinstance(class_names, list):
231
- raise TypeError("class_names must be a list.")
232
- if not isinstance(colors, list):
233
- raise TypeError("colors must be a list.")
234
- if len(colors) == 0:
235
- # Default to matplotlib's color cycle if colors are not provided
236
- colors = plt.rcParams["axes.prop_cycle"].by_key()["color"]
237
-
238
- num_classes = len(class_names)
239
- if num_classes == 0:
240
- raise ValueError("class_names list is empty.")
241
-
242
- # Determine grid size for subplots
243
- n_cols = int(np.ceil(np.sqrt(num_classes)))
244
- n_rows = int(np.ceil(num_classes / n_cols))
245
-
246
- # Create subplots
247
- fig, axes = plt.subplots(n_rows, n_cols, figsize=(n_cols * 5, n_rows * 4))
248
-
249
- # Flatten axes for easy indexing
250
- axes = [axes] if num_classes == 1 else axes.flatten()
251
-
252
- # Line styles for distinction
253
- line_styles = ["-", "--", "-.", ":", (0, (5, 10)), (0, (5, 5)), (0, (3, 5, 1, 5))]
254
-
255
- # Plot each class
256
- for class_idx, class_name in enumerate(class_names):
257
- if class_name not in metric_values_dict_per_class:
258
- raise KeyError(f"Class '{class_name}' not found in metric_values_dict_per_class.")
259
- ax = axes[class_idx]
260
- metric_values_dict = metric_values_dict_per_class[class_name]
261
-
262
- # Plot each metric for the current class
263
- for i, metric_name in enumerate(metrics_to_plot):
264
- if metric_name not in metric_values_dict:
265
- raise KeyError(f"Metric '{metric_name}' not found for class '{class_name}'.")
266
- metric_values = metric_values_dict[metric_name]
267
- if len(metric_values) != len(thresholds):
268
- raise ValueError(
269
- f"Length of metric '{metric_name}' values for class '{class_name}' "
270
- + "does not match length of thresholds."
271
- )
272
- ax.plot(
273
- thresholds,
274
- metric_values,
275
- label=metric_name.capitalize(),
276
- linestyle=line_styles[i % len(line_styles)],
277
- linewidth=2,
278
- color=colors[i % len(colors)],
279
- )
280
-
281
- # Add titles and labels for each subplot
282
- ax.set_title(f"{class_name}", fontsize=12)
283
- ax.set_xlabel("Threshold", fontsize=10)
284
- ax.set_ylabel("Metric Score", fontsize=10)
285
- ax.legend(loc="best", fontsize=8)
286
- ax.grid(True)
287
-
288
- # Hide any unused subplots
289
- for j in range(num_classes, len(axes)):
290
- fig.delaxes(axes[j])
291
-
292
- # Adjust layout and show
293
- plt.tight_layout()
294
-
295
- return fig
296
-
297
-
298
- def plot_confusion_matrices(
299
- conf_mat: np.ndarray,
300
- task: Literal["binary", "multiclass", "multilabel"],
301
- class_names: list[str],
302
- ) -> plt.Figure:
303
- """
304
- Plots confusion matrices for each class in a single figure with multiple subplots.
305
-
306
- Args:
307
- conf_mat (np.ndarray): Confusion matrix or matrices. For binary classification, a single 2x2 matrix.
308
- For multilabel or multiclass, an array of shape (num_classes, 2, 2).
309
- task (Literal["binary", "multiclass", "multilabel"]): Task type.
310
- class_names (List[str]): List of class names.
311
-
312
- Raises:
313
- TypeError: If inputs are not of expected types.
314
- ValueError: If confusion matrix dimensions or task specifications are invalid.
315
-
316
- Returns:
317
- plt.Figure
318
- """
319
- # Validate inputs
320
- if not isinstance(conf_mat, np.ndarray):
321
- raise TypeError("conf_mat must be a numpy ndarray.")
322
- if conf_mat.size == 0:
323
- raise ValueError("conf_mat is empty.")
324
- if not isinstance(task, str) or task not in ["binary", "multiclass", "multilabel"]:
325
- raise ValueError("Invalid task. Expected 'binary', 'multiclass', or 'multilabel'.")
326
- if not isinstance(class_names, list):
327
- raise TypeError("class_names must be a list.")
328
- if len(class_names) == 0:
329
- raise ValueError("class_names list is empty.")
330
-
331
- if task == "binary":
332
- # Binary classification expects a single 2x2 matrix
333
- if conf_mat.shape != (2, 2):
334
- raise ValueError("For binary task, conf_mat must be of shape (2, 2).")
335
- if len(class_names) != 2:
336
- raise ValueError("For binary task, class_names must have exactly two elements.")
337
-
338
- # Plot single confusion matrix
339
- fig = plt.figure(figsize=(4, 4))
340
- sns.heatmap(conf_mat, annot=True, fmt=".2f", cmap="Reds", cbar=False)
341
- plt.title("Confusion Matrix")
342
- plt.xlabel("Predicted Class")
343
- plt.ylabel("True Class")
344
- plt.tight_layout()
345
- else:
346
- # Multilabel or multiclass expects a set of 2x2 matrices
347
- num_labels = conf_mat.shape[0]
348
- if conf_mat.shape[1:] != (2, 2):
349
- raise ValueError("For multilabel or multiclass task, conf_mat must have shape (num_labels, 2, 2).")
350
- if len(class_names) != num_labels:
351
- raise ValueError("Length of class_names must match number of labels in conf_mat.")
352
-
353
- # Determine grid size for subplots
354
- n_cols = int(np.ceil(np.sqrt(num_labels)))
355
- n_rows = int(np.ceil(num_labels / n_cols))
356
-
357
- # Create subplots
358
- fig, axes = plt.subplots(n_rows, n_cols, figsize=(n_cols * 2, n_rows * 2))
359
-
360
- # Flatten axes for easy indexing
361
- axes = [axes] if num_labels == 1 else axes.flatten()
362
-
363
- # Plot each class's confusion matrix
364
- for i in range(num_labels):
365
- cm = conf_mat[i]
366
- ax = axes[i]
367
- sns.heatmap(cm, annot=True, fmt=".2f", cmap="Reds", cbar=False, ax=ax)
368
- ax.set_title(f"{class_names[i]}")
369
- ax.set_xlabel("Predicted Class")
370
- ax.set_ylabel("True Class")
371
-
372
- # Hide any unused subplots
373
- for j in range(num_labels, len(axes)):
374
- fig.delaxes(axes[j])
375
-
376
- # Adjust layout and show
377
- plt.tight_layout()
378
-
379
- return fig
1
+ """
2
+ Module containing functions to plot performance metrics.
3
+
4
+ This script provides a variety of functions to visualize performance metrics in different formats,
5
+ including bar charts, line plots, and heatmaps. These visualizations help analyze metrics such as
6
+ overall performance, per-class performance, and performance across thresholds.
7
+
8
+ Functions:
9
+ - plot_overall_metrics: Plots a bar chart for overall performance metrics.
10
+ - plot_metrics_per_class: Plots metric values per class with unique lines and colors.
11
+ - plot_metrics_across_thresholds: Plots metrics across different thresholds.
12
+ - plot_metrics_across_thresholds_per_class: Plots metrics across thresholds for each class.
13
+ - plot_confusion_matrices: Visualizes confusion matrices for binary, multiclass, or multilabel tasks.
14
+ """
15
+
16
+ from typing import Literal
17
+
18
+ import matplotlib.pyplot as plt
19
+ import numpy as np
20
+ import pandas as pd
21
+ from sklearn.metrics import ConfusionMatrixDisplay
22
+
23
+ MATPLOTLIB_BINARY_CONFUSION_MATRIX_FIGURE_NUM = "performance-tab-binary-confusion-matrix-plot"
24
+ MATPLOTLIB_MULTICLASS_CONFUSION_MATRIX_FIGURE_NUM = "performance-tab-multiclass-confusion-matrix-plot"
25
+ MATPLOTLIB_OVERALL_METRICS_FIGURE_NUM = "performance-tab-overall-metrics-plot"
26
+ MATPLOTLIB_PER_CLASS_METRICS_FIGURE_NUM = "performance-tab-per-class-metrics-plot"
27
+ MATPLOTLIB_ACROSS_METRICS_THRESHOLDS_FIGURE_NUM = "performance-tab-metrics-across-thresholds-plot"
28
+ MATPLOTLIB_ACROSS_METRICS_THRESHOLDS_PER_CLASS_FIGURE_NUM = "performance-tab-metrics-across-thresholds-per-class-plot"
29
+
30
+
31
+ def plot_overall_metrics(metrics_df: pd.DataFrame, colors: list[str]):
32
+ """
33
+ Plots a bar chart for overall performance metrics.
34
+
35
+ Args:
36
+ metrics_df (pd.DataFrame): DataFrame containing metric names as index and an 'Overall' column.
37
+ colors (List[str]): List of colors for the bars.
38
+
39
+ Raises:
40
+ TypeError: If `metrics_df` is not a DataFrame or `colors` is not a list.
41
+ KeyError: If 'Overall' column is missing in `metrics_df`.
42
+ ValueError: If `metrics_df` is empty.
43
+
44
+ Returns:
45
+ plt.Figure
46
+ """
47
+ # Validate input types and content
48
+ if not isinstance(metrics_df, pd.DataFrame):
49
+ raise TypeError("metrics_df must be a pandas DataFrame.")
50
+ if "Overall" not in metrics_df.columns:
51
+ raise KeyError("metrics_df must contain an 'Overall' column.")
52
+ if metrics_df.empty:
53
+ raise ValueError("metrics_df is empty.")
54
+ if not isinstance(colors, list):
55
+ raise TypeError("colors must be a list.")
56
+ if len(colors) == 0:
57
+ # Default to matplotlib's color cycle if colors are not provided
58
+ colors = plt.rcParams["axes.prop_cycle"].by_key()["color"]
59
+
60
+ # Extract metric names and values
61
+ metrics = metrics_df.index # Metric names
62
+ values = metrics_df["Overall"].to_numpy() # Metric values
63
+
64
+ # Plot bar chart
65
+ fig = plt.figure(MATPLOTLIB_OVERALL_METRICS_FIGURE_NUM, figsize=(10, 6))
66
+ fig.clear()
67
+ fig.tight_layout(pad=0)
68
+ fig.set_dpi(300)
69
+
70
+ plt.bar(metrics, values, color=colors[: len(metrics)])
71
+
72
+ # Add titles, labels, and format
73
+ plt.title("Overall Metric Scores", fontsize=16)
74
+ plt.xlabel("Metrics", fontsize=12)
75
+ plt.ylabel("Score", fontsize=12)
76
+ plt.xticks(rotation=45, ha="right", fontsize=10)
77
+ plt.grid(axis="y", linestyle="--", alpha=0.7)
78
+
79
+ return fig
80
+
81
+
82
+ def plot_metrics_per_class(metrics_df: pd.DataFrame, colors: list[str]):
83
+ """
84
+ Plots metric values per class, with each metric represented by a distinct color and line.
85
+
86
+ Args:
87
+ metrics_df (pd.DataFrame): DataFrame containing metrics as index and class names as columns.
88
+ colors (List[str]): List of colors for the lines.
89
+
90
+ Raises:
91
+ TypeError: If inputs are not of expected types.
92
+ ValueError: If `metrics_df` is empty.
93
+
94
+ Returns:
95
+ plt.Figure
96
+ """
97
+ # Validate inputs
98
+ if not isinstance(metrics_df, pd.DataFrame):
99
+ raise TypeError("metrics_df must be a pandas DataFrame.")
100
+ if metrics_df.empty:
101
+ raise ValueError("metrics_df is empty.")
102
+ if not isinstance(colors, list):
103
+ raise TypeError("colors must be a list.")
104
+ if len(colors) == 0:
105
+ # Default to matplotlib's color cycle if colors are not provided
106
+ colors = plt.rcParams["axes.prop_cycle"].by_key()["color"]
107
+
108
+ # Line styles for distinction
109
+ line_styles = ["-", "--", "-.", ":", (0, (5, 10)), (0, (5, 5)), (0, (3, 5, 1, 5))]
110
+ fig = plt.figure(MATPLOTLIB_OVERALL_METRICS_FIGURE_NUM, figsize=(10, 6))
111
+ fig.clear()
112
+ fig.tight_layout(pad=0)
113
+ fig.set_dpi(300)
114
+
115
+ # Loop over each metric and plot it
116
+ for i, metric_name in enumerate(metrics_df.index):
117
+ values = metrics_df.loc[metric_name] # Metric values for each class
118
+ classes = metrics_df.columns # Class labels
119
+ plt.plot(
120
+ classes,
121
+ values,
122
+ label=metric_name,
123
+ marker="o",
124
+ markersize=8,
125
+ linewidth=2,
126
+ linestyle=line_styles[i % len(line_styles)],
127
+ color=colors[i % len(colors)],
128
+ )
129
+
130
+ # Add titles, labels, legend, and format
131
+ plt.title("Metric Scores per Class", fontsize=16)
132
+ plt.xlabel("Class", fontsize=12)
133
+ plt.ylabel("Score", fontsize=12)
134
+ plt.legend(loc="lower right")
135
+ plt.grid(True)
136
+
137
+ return fig
138
+
139
+
140
+ def plot_metrics_across_thresholds(
141
+ thresholds: np.ndarray,
142
+ metric_values_dict: dict[str, np.ndarray],
143
+ metrics_to_plot: list[str],
144
+ colors: list[str],
145
+ ):
146
+ """
147
+ Plots metrics across different thresholds.
148
+
149
+ Args:
150
+ thresholds (np.ndarray): Array of threshold values.
151
+ metric_values_dict (Dict[str, np.ndarray]): Dictionary mapping metric names to their values.
152
+ metrics_to_plot (List[str]): List of metric names to plot.
153
+ colors (List[str]): List of colors for the lines.
154
+
155
+ Raises:
156
+ TypeError: If inputs are not of expected types.
157
+ ValueError: If thresholds or metric values have mismatched lengths.
158
+
159
+ Returns:
160
+ plt.Figure
161
+ """
162
+ # Validate inputs
163
+ if not isinstance(thresholds, np.ndarray):
164
+ raise TypeError("thresholds must be a numpy ndarray.")
165
+ if thresholds.size == 0:
166
+ raise ValueError("thresholds array is empty.")
167
+ if not isinstance(metric_values_dict, dict):
168
+ raise TypeError("metric_values_dict must be a dictionary.")
169
+ if not isinstance(metrics_to_plot, list):
170
+ raise TypeError("metrics_to_plot must be a list.")
171
+ if not isinstance(colors, list):
172
+ raise TypeError("colors must be a list.")
173
+ if len(colors) == 0:
174
+ # Default to matplotlib's color cycle if colors are not provided
175
+ colors = plt.rcParams["axes.prop_cycle"].by_key()["color"]
176
+
177
+ # Line styles for distinction
178
+ line_styles = ["-", "--", "-.", ":", (0, (5, 10)), (0, (5, 5)), (0, (3, 5, 1, 5))]
179
+ fig = plt.figure(MATPLOTLIB_ACROSS_METRICS_THRESHOLDS_FIGURE_NUM, figsize=(10, 6))
180
+ fig.clear()
181
+ fig.tight_layout(pad=0)
182
+ fig.set_dpi(300)
183
+
184
+ # Plot each metric against thresholds
185
+ for i, metric_name in enumerate(metrics_to_plot):
186
+ if metric_name not in metric_values_dict:
187
+ raise KeyError(f"Metric '{metric_name}' not found in metric_values_dict.")
188
+ metric_values = metric_values_dict[metric_name]
189
+ if len(metric_values) != len(thresholds):
190
+ raise ValueError(f"Length of metric '{metric_name}' values does not match length of thresholds.")
191
+ plt.plot(
192
+ thresholds,
193
+ metric_values,
194
+ label=metric_name.capitalize(),
195
+ linestyle=line_styles[i % len(line_styles)],
196
+ linewidth=2,
197
+ color=colors[i % len(colors)],
198
+ )
199
+
200
+ # Add titles, labels, legend, and format
201
+ plt.title("Metrics across Different Thresholds", fontsize=16)
202
+ plt.xlabel("Threshold", fontsize=12)
203
+ plt.ylabel("Metric Score", fontsize=12)
204
+ plt.legend(loc="best")
205
+ plt.grid(True)
206
+
207
+ return fig
208
+
209
+
210
def plot_metrics_across_thresholds_per_class(
    thresholds: np.ndarray,
    metric_values_dict_per_class: dict[str, dict[str, np.ndarray]],
    metrics_to_plot: list[str],
    class_names: list[str],
    colors: list[str],
):
    """
    Plots metrics across different thresholds per class, one subplot per class.

    Args:
        thresholds (np.ndarray): Array of threshold values.
        metric_values_dict_per_class (Dict[str, Dict[str, np.ndarray]]): Dictionary mapping class names
            to metric dictionaries, each containing metric names and their values across thresholds.
        metrics_to_plot (List[str]): List of metric names to plot.
        class_names (List[str]): List of class names.
        colors (List[str]): List of colors for the lines. If empty, matplotlib's
            default color cycle is used.

    Raises:
        TypeError: If inputs are not of expected types.
        ValueError: If inputs have mismatched lengths or are empty.
        KeyError: If a class or metric is missing from metric_values_dict_per_class.

    Returns:
        plt.Figure
    """
    # Validate inputs
    if not isinstance(thresholds, np.ndarray):
        raise TypeError("thresholds must be a numpy ndarray.")
    if thresholds.size == 0:
        raise ValueError("thresholds array is empty.")
    if not isinstance(metric_values_dict_per_class, dict):
        raise TypeError("metric_values_dict_per_class must be a dictionary.")
    if not isinstance(metrics_to_plot, list):
        raise TypeError("metrics_to_plot must be a list.")
    if not isinstance(class_names, list):
        raise TypeError("class_names must be a list.")
    if not isinstance(colors, list):
        raise TypeError("colors must be a list.")
    if len(colors) == 0:
        # Default to matplotlib's color cycle if colors are not provided
        colors = plt.rcParams["axes.prop_cycle"].by_key()["color"]

    num_classes = len(class_names)
    if num_classes == 0:
        raise ValueError("class_names list is empty.")

    # Determine grid size for subplots (near-square layout)
    n_cols = int(np.ceil(np.sqrt(num_classes)))
    n_rows = int(np.ceil(num_classes / n_cols))

    # Create subplots. `clear=True` empties a previously used figure with this
    # figure number *before* the new axes are created. The previous approach of
    # calling fig.clear() after plt.subplots() detached the axes that had just
    # been created, so nothing plotted below appeared in the returned figure.
    fig, axes = plt.subplots(
        n_rows,
        n_cols,
        figsize=(n_cols * 5, n_rows * 4),
        num=MATPLOTLIB_ACROSS_METRICS_THRESHOLDS_PER_CLASS_FIGURE_NUM,
        clear=True,
    )
    fig.tight_layout(pad=0)
    fig.set_dpi(300)

    # Flatten axes for easy indexing (plt.subplots returns a bare Axes for a 1x1 grid)
    axes = [axes] if num_classes == 1 else axes.flatten()

    # Line styles for distinction between metrics within one subplot
    line_styles = ["-", "--", "-.", ":", (0, (5, 10)), (0, (5, 5)), (0, (3, 5, 1, 5))]

    # Plot each class
    for class_idx, class_name in enumerate(class_names):
        if class_name not in metric_values_dict_per_class:
            raise KeyError(f"Class '{class_name}' not found in metric_values_dict_per_class.")
        ax = axes[class_idx]
        metric_values_dict = metric_values_dict_per_class[class_name]

        # Plot each metric for the current class
        for i, metric_name in enumerate(metrics_to_plot):
            if metric_name not in metric_values_dict:
                raise KeyError(f"Metric '{metric_name}' not found for class '{class_name}'.")
            metric_values = metric_values_dict[metric_name]
            if len(metric_values) != len(thresholds):
                raise ValueError(f"Length of metric '{metric_name}' values for class '{class_name}' " + "does not match length of thresholds.")
            ax.plot(
                thresholds,
                metric_values,
                label=metric_name.capitalize(),
                linestyle=line_styles[i % len(line_styles)],
                linewidth=2,
                color=colors[i % len(colors)],
            )

        # Add titles and labels for each subplot
        ax.set_title(f"{class_name}", fontsize=12)
        ax.set_xlabel("Threshold", fontsize=10)
        ax.set_ylabel("Metric Score", fontsize=10)
        ax.legend(loc="best", fontsize=8)
        ax.grid(True)

    return fig
303
+
304
+
305
def plot_confusion_matrices(
    conf_mat: np.ndarray,
    task: Literal["binary", "multiclass", "multilabel"],
    class_names: list[str],
):
    """
    Renders confusion matrices in a single figure.

    For a binary task a lone 2x2 matrix is drawn; for multiclass/multilabel
    tasks, one 2x2 per-label matrix is drawn in its own subplot, arranged in a
    near-square grid.

    Args:
        conf_mat (np.ndarray): Confusion matrix or matrices. Shape (2, 2) for
            binary classification, or (num_classes, 2, 2) for
            multiclass/multilabel.
        task (Literal["binary", "multiclass", "multilabel"]): Task type.
        class_names (List[str]): List of class names (used as subplot titles
            for multiclass/multilabel).

    Raises:
        TypeError: If inputs are not of expected types.
        ValueError: If confusion matrix dimensions or task specifications are invalid.

    Returns:
        plt.Figure
    """
    # Basic input checks shared by all task types
    if not isinstance(conf_mat, np.ndarray):
        raise TypeError("conf_mat must be a numpy ndarray.")
    if conf_mat.size == 0:
        raise ValueError("conf_mat is empty.")
    if not isinstance(task, str) or task not in ["binary", "multiclass", "multilabel"]:
        raise ValueError("Invalid task. Expected 'binary', 'multiclass', or 'multilabel'.")

    if task == "binary":
        # A single 2x2 matrix is expected for binary classification
        if conf_mat.shape != (2, 2):
            raise ValueError("For binary task, conf_mat must be of shape (2, 2).")

        fig, ax = plt.subplots(num=MATPLOTLIB_BINARY_CONFUSION_MATRIX_FIGURE_NUM, figsize=(6, 6))
        fig.tight_layout()
        fig.set_dpi(300)

        display = ConfusionMatrixDisplay(confusion_matrix=conf_mat, display_labels=["Negative", "Positive"])
        display.plot(cmap="Reds", ax=ax, colorbar=False, values_format=".2f")
        ax.set_title("Confusion Matrix")
        return fig

    # Multiclass/multilabel: one 2x2 matrix per label
    n_matrices = conf_mat.shape[0]

    if conf_mat.shape[1:] != (2, 2):
        raise ValueError("For multilabel or multiclass task, conf_mat must have shape (num_labels, 2, 2).")
    if len(class_names) != n_matrices:
        raise ValueError("Length of class_names must match number of labels in conf_mat.")

    # Arrange subplots in a near-square grid
    grid_cols = int(np.ceil(np.sqrt(n_matrices)))
    grid_rows = int(np.ceil(n_matrices / grid_cols))

    fig, axes = plt.subplots(grid_rows, grid_cols, figsize=(4 * grid_cols, 4 * grid_rows), num=MATPLOTLIB_MULTICLASS_CONFUSION_MATRIX_FIGURE_NUM)
    fig.set_dpi(300)

    # plt.subplots returns a bare Axes for a 1x1 grid; normalize to a flat list
    axes = axes.flatten() if hasattr(axes, "flatten") else [axes]

    # Draw one confusion matrix per class
    for pos, (matrix, label) in enumerate(zip(conf_mat, class_names, strict=True)):
        panel = axes[pos]
        ConfusionMatrixDisplay(confusion_matrix=matrix, display_labels=["Negative", "Positive"]).plot(
            cmap="Reds", ax=panel, colorbar=False, values_format=".2f"
        )
        panel.set_title(f"{label}")
        panel.set_xlabel("Predicted class")
        panel.set_ylabel("True class")

    # Drop grid cells that received no matrix
    for spare in axes[n_matrices:]:
        fig.delaxes(spare)

    plt.tight_layout()

    return fig