PyPI - spacr - Versions diffs - 1.0.9__py3-none-any.whl → 1.1.1__py3-none-any.whl - Mend

spacr 1.0.9__py3-none-any.whl → 1.1.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (30) hide show

spacr/__init__.py +3 -2
spacr/app_classify.py +10 -0
spacr/app_mask.py +9 -0
spacr/app_measure.py +9 -0
spacr/app_sequencing.py +9 -0
spacr/core.py +172 -1
spacr/deep_spacr.py +296 -7
spacr/gui.py +68 -0
spacr/gui_core.py +319 -10
spacr/gui_elements.py +772 -13
spacr/gui_utils.py +304 -12
spacr/io.py +887 -71
spacr/logger.py +36 -0
spacr/measure.py +206 -28
spacr/ml.py +606 -142
spacr/plot.py +797 -131
spacr/sequencing.py +363 -8
spacr/settings.py +1158 -38
spacr/sp_stats.py +80 -12
spacr/spacr_cellpose.py +115 -2
spacr/submodules.py +747 -19
spacr/timelapse.py +237 -53
spacr/toxo.py +132 -6
spacr/utils.py +2422 -80
{spacr-1.0.9.dist-info → spacr-1.1.1.dist-info}/METADATA +31 -17
{spacr-1.0.9.dist-info → spacr-1.1.1.dist-info}/RECORD +30 -30
{spacr-1.0.9.dist-info → spacr-1.1.1.dist-info}/LICENSE +0 -0
{spacr-1.0.9.dist-info → spacr-1.1.1.dist-info}/WHEEL +0 -0
{spacr-1.0.9.dist-info → spacr-1.1.1.dist-info}/entry_points.txt +0 -0
{spacr-1.0.9.dist-info → spacr-1.1.1.dist-info}/top_level.txt +0 -0

spacr/sp_stats.py CHANGED Viewed

@@ -10,7 +10,7 @@ def choose_p_adjust_method(num_groups, num_data_points):
     """
     Selects the most appropriate p-value adjustment method based on data characteristics.
-    Parameters:
+    Args:
     - num_groups: Number of unique groups being compared
     - num_data_points: Number of data points per group (assuming balanced groups)
@@ -30,7 +30,25 @@ def choose_p_adjust_method(num_groups, num_data_points):
         return 'bonferroni'  # Very conservative, use for strict control of Type I errors
 def perform_normality_tests(df, grouping_column, data_columns):
-    """Perform normality tests for each group and data column."""
+    """
+    Perform normality tests (Shapiro-Wilk or D'Agostino-Pearson) on grouped data.
+    Args:
+        df (pd.DataFrame): Input DataFrame containing the data to test.
+        grouping_column (str): Column name to group data by (e.g., condition or treatment).
+        data_columns (list of str): List of column names containing numeric data to test for normality.
+    Returns:
+        tuple:
+            - is_normal (bool): True if all group-column combinations pass the normality test (p > 0.05), else False.
+            - normality_results (list of dict): List of results for each group-column combination including:
+                - 'Comparison': Description of the test
+                - 'Test Statistic': Computed test statistic (None if skipped)
+                - 'p-value': P-value of the test (None if skipped)
+                - 'Test Name': Name of the test used or 'Skipped'
+                - 'Column': The data column tested
+                - 'n': Sample size
+    """
     unique_groups = df[grouping_column].unique()
     normality_results = []
@@ -77,14 +95,40 @@ def perform_normality_tests(df, grouping_column, data_columns):
 def perform_levene_test(df, grouping_column, data_column):
-    """Perform Levene's test for equal variance."""
+    """
+    Perform Levene’s test for equal variances across groups.
+    Parameters:
+        df (pd.DataFrame): The DataFrame containing the data.
+        grouping_column (str): The column indicating group membership.
+        data_column (str): The column containing the numeric data.
+    Returns:
+        tuple: (statistic, p-value) from Levene’s test.
+    """
     unique_groups = df[grouping_column].unique()
     grouped_data = [df.loc[df[grouping_column] == group, data_column].dropna() for group in unique_groups]
     stat, p_value = levene(*grouped_data)
     return stat, p_value
 def perform_statistical_tests(df, grouping_column, data_columns, paired=False):
-    """Perform statistical tests for each data column."""
+    """
+    Perform statistical tests to compare groups for each specified data column.
+    Parameters:
+        df (pd.DataFrame): The DataFrame containing the data.
+        grouping_column (str): The column indicating group membership.
+        data_columns (list): List of column names to perform tests on.
+        paired (bool): Whether to use paired tests (only for two-group comparisons).
+    Returns:
+        list of dict: Each dict contains:
+            - 'Column': Name of the column tested.
+            - 'Test Name': Statistical test used.
+            - 'Test Statistic': Test statistic value.
+            - 'p-value': P-value of the test.
+            - 'Groups': Number of groups compared.
+    """
     unique_groups = df[grouping_column].unique()
     test_results = []
@@ -125,7 +169,24 @@ def perform_statistical_tests(df, grouping_column, data_columns, paired=False):
 def perform_posthoc_tests(df, grouping_column, data_column, is_normal):
-    """Perform post-hoc tests for multiple groups with both original and adjusted p-values."""
+    """
+    Perform post-hoc pairwise comparisons between groups after a significant overall test (e.g., ANOVA or Kruskal-Wallis).
+    Args:
+        df (pd.DataFrame): Input DataFrame containing the data to analyze.
+        grouping_column (str): Column name representing group membership.
+        data_column (str): Column name with the continuous variable to compare.
+        is_normal (bool): Indicator of whether the data meets normality assumptions
+                          (determines test type: Tukey HSD if True, Dunn's test if False).
+    Returns:
+        list of dict: List of dictionaries summarizing pairwise comparisons, each including:
+            - 'Comparison': Description of the group pair.
+            - 'Original p-value': Raw p-value (None for Tukey HSD).
+            - 'Adjusted p-value': Corrected p-value for multiple testing.
+            - 'Adjusted Method': Method used for p-value adjustment.
+            - 'Test Name': The post-hoc test performed ("Tukey HSD" or "Dunn's Post-hoc").
+    """
     unique_groups = df[grouping_column].unique()
     posthoc_results = []
@@ -164,16 +225,23 @@ def perform_posthoc_tests(df, grouping_column, data_column, is_normal):
 def chi_pairwise(raw_counts, verbose=False):
     """
-    Perform pairwise chi-square or Fisher's exact tests between all unique group pairs
-    and apply p-value correction.
+    Perform pairwise statistical tests (Chi-Square or Fisher's Exact) on contingency tables
+    derived from count data, and apply multiple testing correction.
-    Parameters:
-    - raw_counts (DataFrame): Contingency table with group-wise counts.
-    - verbose (bool): Whether to print results for each pair.
+    Args:
+        raw_counts (pd.DataFrame): A DataFrame where rows represent groups and columns represent categories.
+                                   The values are raw counts.
+        verbose (bool): If True, prints the resulting pairwise test summary.
     Returns:
-    - pairwise_df (DataFrame): DataFrame with pairwise test results, including corrected p-values.
-    """
+        pd.DataFrame: A DataFrame with pairwise comparisons including:
+            - 'Group 1': First group in the comparison
+            - 'Group 2': Second group in the comparison
+            - 'Test Name': Type of statistical test used ('Chi-Square' or 'Fisher's Exact')
+            - 'p-value': Raw p-value for the test
+            - 'p-value_adj': Adjusted p-value after multiple testing correction
+            - 'adj': Name of the correction method used
+    """
     pairwise_results = []
     groups = raw_counts.index.unique()  # Use index from raw_counts for group pairs
     raw_p_values = []  # Store raw p-values for correction later

spacr/spacr_cellpose.py CHANGED Viewed

@@ -66,7 +66,43 @@ def parse_cellpose4_output(output):
     raise ValueError(f"Unrecognized Cellpose flows format: type={type(flows)}, len={len(flows) if hasattr(flows,'__len__') else 'unknown'}")
 def identify_masks_finetune(settings):
+    """
+    Generate Cellpose segmentation masks for a batch of images using a pretrained or custom model.
+    This function loads a set of images from the provided source directory, applies optional
+    preprocessing (normalization, resizing), and uses a Cellpose model to generate segmentation masks.
+    Masks are optionally visualized and saved to disk. The model, channels, and other parameters are
+    defined in the `settings` dictionary.
+    Args:
+        settings (dict): Dictionary containing configuration parameters. Must include:
+            - 'src' (str): Source folder with `.tif` images.
+            - 'model_name' (str): Name of Cellpose model to use (e.g., 'cyto2', 'nucleus').
+            - 'custom_model' (str or None): Path to custom model file (.pt), if used.
+            - 'channels' (list): List of image channel indices to use for segmentation.
+            - 'grayscale' (bool): Whether input images are single-channel.
+            - 'diameter' (float): Estimated diameter of objects in pixels.
+            - 'flow_threshold' (float): Threshold for mask acceptance based on flow prediction.
+            - 'CP_prob' (float): Cell probability threshold for segmentation.
+            - 'rescale' (float): Rescaling factor.
+            - 'resample' (bool): Whether to resample the image during preprocessing.
+            - 'normalize' (bool): Whether to normalize pixel intensities.
+            - 'percentiles' (list): Lower and upper percentiles for normalization.
+            - 'invert' (bool): Whether to invert image intensities.
+            - 'remove_background' (bool): Whether to subtract background value.
+            - 'background' (list): Background pixel intensity values to subtract per channel.
+            - 'Signal_to_noise' (float): Threshold for signal-to-noise filtering.
+            - 'resize' (bool): Whether to resize to fixed target dimensions.
+            - 'target_height' (int): Height for resizing.
+            - 'target_width' (int): Width for resizing.
+            - 'batch_size' (int): Number of images to process per batch.
+            - 'fill_in' (bool): Whether to fill holes in masks.
+            - 'save' (bool): Whether to save the masks to disk.
+            - 'verbose' (bool): Whether to print detailed progress and visualization output.
+    Returns:
+        None. Masks are optionally saved to the 'masks' subdirectory in the source folder.
+    """
     from .plot import print_mask_and_flows
     from .utils import resize_images_and_labels, print_progress, save_settings, fill_holes_in_mask
     from .io import _load_normalized_images_and_labels, _load_images_and_labels
@@ -189,7 +225,35 @@ def identify_masks_finetune(settings):
     return
 def generate_masks_from_imgs(src, model, model_name, batch_size, diameter, cellprob_threshold, flow_threshold, grayscale, save, normalize, channels, percentiles, invert, plot, resize, target_height, target_width, remove_background, background, Signal_to_noise, verbose):
+    """
+    Apply a Cellpose model to a batch of images and generate segmentation masks.
+    Args:
+        src (str): Directory containing input .tif images.
+        model (CellposeModel): Initialized Cellpose model.
+        model_name (str): Model identifier (e.g., 'cyto2', 'nucleus').
+        batch_size (int): Number of images processed in each batch.
+        diameter (float): Estimated object diameter in pixels.
+        cellprob_threshold (float): Cell probability threshold.
+        flow_threshold (float): Flow threshold for mask acceptance.
+        grayscale (bool): If True, treat images as single-channel.
+        save (bool): Whether to save output masks.
+        normalize (bool): Whether to normalize input images.
+        channels (list): Channels to use for processing (e.g., [0, 1]).
+        percentiles (list): Percentiles for normalization (e.g., [2, 99]).
+        invert (bool): If True, invert image intensity.
+        plot (bool): If True, display masks and flows.
+        resize (bool): Whether to resize images to fixed target dimensions.
+        target_height (int): Height after resizing.
+        target_width (int): Width after resizing.
+        remove_background (bool): Whether to subtract background intensity.
+        background (list): Background intensity values for subtraction.
+        Signal_to_noise (float): Minimum SNR threshold.
+        verbose (bool): If True, print detailed status messages.
+    Returns:
+        None. Saves masks to disk if `save=True`.
+    """
     from .io import _load_images_and_labels, _load_normalized_images_and_labels
     from .utils import resize_images_and_labels, resizescikit, print_progress
     from .plot import print_mask_and_flows
@@ -264,7 +328,17 @@ def generate_masks_from_imgs(src, model, model_name, batch_size, diameter, cellp
                 cv2.imwrite(output_filename, mask)
 def check_cellpose_models(settings):
+    """
+    Evaluate multiple pretrained Cellpose models ('cyto', 'nuclei', 'cyto2', 'cyto3')
+    on a given dataset using standardized settings.
+    Args:
+        settings (dict): Dictionary of parameters controlling input source, model parameters,
+                         image preprocessing, and save/visualization options.
+    Returns:
+        None. Runs `generate_masks_from_imgs()` for each model and displays results.
+    """
     from .settings import get_check_cellpose_models_default_settings
     settings = get_check_cellpose_models_default_settings(settings)
@@ -286,7 +360,18 @@ def check_cellpose_models(settings):
     return
 def save_results_and_figure(src, fig, results):
+    """
+    Save a results DataFrame and associated figure to disk.
+    Args:
+        src (str): Path to the source directory where the 'results' subfolder will be created.
+        fig (matplotlib.figure.Figure): The figure object to be saved as a PDF.
+        results (pd.DataFrame or dict or list): Results to be saved. If not a DataFrame,
+                                                it will be converted to one.
+    Returns:
+        None. Writes results to 'results.csv' and the figure to 'model_comparison_plot.pdf'.
+    """
     if not isinstance(results, pd.DataFrame):
         results = pd.DataFrame(results)
@@ -299,6 +384,22 @@ def save_results_and_figure(src, fig, results):
     print(f'Saved figure to {fig_path} and results to {results_path}')
 def compare_mask(args):
+    """
+    Compare segmentation masks across different directories for a given filename
+    using multiple evaluation metrics.
+    Args:
+        args (tuple): A tuple containing:
+            - src (str): Not used directly, reserved for future use.
+            - filename (str): Name of the mask file to compare across directories.
+            - dirs (list of str): List of directory paths where mask files are located.
+            - conditions (list of str): Labels corresponding to each directory for result naming.
+    Returns:
+        dict or None: A dictionary containing comparison metrics (Jaccard index, boundary F1 score,
+                      and average precision) for all pairwise combinations of masks.
+                      Returns None if any mask file is missing.
+    """
     src, filename, dirs, conditions = args
     paths = [os.path.join(d, filename) for d in dirs]
@@ -327,6 +428,18 @@ def compare_mask(args):
     return file_results
 def compare_cellpose_masks(src, verbose=False, processes=None, save=True):
+    """
+    Compare Cellpose segmentation masks across multiple model output folders.
+    Args:
+        src (str): Path to the parent directory containing subdirectories for each model condition.
+        verbose (bool): If True, visualize each mask comparison using matplotlib.
+        processes (int or None): Number of parallel processes to use. If None, uses os.cpu_count().
+        save (bool): Whether to save the visualization outputs and results to disk.
+    Returns:
+        None. Results are printed, plotted, and optionally saved to disk.
+    """
     from .plot import visualize_cellpose_masks, plot_comparison_results
     from .io import _read_mask

spacr 1.0.9__py3-none-any.whl → 1.1.1__py3-none-any.whl

spacr 1.0.9__py3-none-any.whl → 1.1.1__py3-none-any.whl