masster-0.5.28-py3-none-any.whl → masster-0.6.1-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.


masster/study/merge.py CHANGED
@@ -441,9 +441,15 @@ def merge(study, **kwargs) -> None:
      cached_valid_adducts = None
      try:
          cached_adducts_df = study._get_adducts()
+         # Remove all adducts with wrong polarity
+         if study.polarity == "positive":
+             cached_adducts_df = cached_adducts_df.filter(pl.col("charge") >= 0)
+         else:
+             cached_adducts_df = cached_adducts_df.filter(pl.col("charge") <= 0)
          if not cached_adducts_df.is_empty():
              cached_valid_adducts = set(cached_adducts_df["name"].to_list())
          else:
+             study.logger.warning(f"No valid adducts found for polarity '{study.polarity}'")
              cached_valid_adducts = set()
      except Exception as e:
          study.logger.warning(f"Could not retrieve study adducts: {e}")
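The new polarity guard reduces to a simple Polars filter over the adducts table. A minimal standalone sketch, assuming a table with the `name` and `charge` columns used above (the values are illustrative):

```python
import polars as pl

# Hypothetical adducts table with the columns used in the hunk above
adducts_df = pl.DataFrame({
    "name": ["[M+H]1+", "[M+Na]1+", "[M-H]1-", "[M]"],
    "charge": [1, 1, -1, 0],
})

polarity = "positive"
# Keep only adducts whose charge sign matches the study polarity;
# charge 0 passes either branch, matching the >= / <= comparisons above
if polarity == "positive":
    adducts_df = adducts_df.filter(pl.col("charge") >= 0)
else:
    adducts_df = adducts_df.filter(pl.col("charge") <= 0)

valid_adducts = set(adducts_df["name"].to_list())
valid_adducts.add("?")  # '?' is always allowed, as in merge()
print(valid_adducts)    # {'[M+H]1+', '[M+Na]1+', '[M]', '?'}
```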
@@ -452,6 +458,13 @@ def merge(study, **kwargs) -> None:
      # Always allow '?' adducts
      cached_valid_adducts.add("?")

+     # Bypass for single sample case
+     if len(study.samples_df) == 1:
+         study.logger.info("Single sample detected - bypassing merge algorithm and using direct feature mapping")
+         _handle_single_sample_merge(study, cached_adducts_df, cached_valid_adducts)
+         # Skip all post-processing for single sample case
+         return
+
      # Route to algorithm implementation
      if params.method == "kd":
          consensus_map = _merge_kd(study, params)
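The observable effect of the bypass, as a hedged usage sketch (a `study` already holding exactly one processed sample is assumed; attribute names are taken from the hunks in this diff):

```python
# `study` is assumed to be a masster Study with exactly one sample loaded
if len(study.samples_df) == 1:
    study.merge()  # logs the bypass and returns after direct feature mapping
    # Every consensus feature then comes from that single sample
    assert (study.consensus_df["number_samples"] == 1).all()
    assert len(study.consensus_mapping_df) == len(study.consensus_df)
```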
@@ -1719,6 +1732,10 @@ def _calculate_consensus_statistics(
          mz_values: m/z values from chunk consensus features
          intensity_values: Intensity values from chunk consensus features
          quality_values: Quality values from chunk consensus features
+         number_features: Number of unique features contributing
+         number_samples: Number of unique samples contributing
+         cached_adducts_df: Cached DataFrame of valid adducts for the study
+         cached_valid_adducts: Cached set of valid adduct names for the study

      Returns:
          Dictionary with consensus feature metadata
@@ -3612,6 +3629,142 @@ def __merge_adduct_grouping(study, consensus_data, rt_tol, mz_tol):
      return adduct_group_list, adduct_of_list


+ def _handle_single_sample_merge(study, cached_adducts_df=None, cached_valid_adducts=None):
+     """
+     Handle merge for the special case of a single sample.
+     Directly populate consensus_df from the sample's features_df without any filtering.
+
+     Args:
+         study: Study object with single sample
+         cached_adducts_df: Pre-computed adducts DataFrame (optional)
+         cached_valid_adducts: Set of valid adduct names (optional)
+     """
+     import polars as pl
+     import uuid
+
+     if len(study.samples_df) != 1:
+         raise ValueError("_handle_single_sample_merge should only be called with exactly one sample")
+
+     # Get the single sample's features
+     sample_row = study.samples_df.row(0, named=True)
+     sample_uid = sample_row["sample_uid"]
+
+     # Filter features for this sample
+     sample_features = study.features_df.filter(pl.col("sample_uid") == sample_uid)
+
+     if len(sample_features) == 0:
+         study.logger.warning("No features found for single sample")
+         study.consensus_df = pl.DataFrame()
+         study.consensus_mapping_df = pl.DataFrame()
+         return
+
+     study.logger.info(f"Creating consensus from {len(sample_features)} features in single sample")
+
+     # Create consensus features directly from sample features
+     consensus_list = []
+     mapping_list = []
+
+     # Cache valid adducts
+     valid_adducts = cached_valid_adducts if cached_valid_adducts is not None else set()
+     valid_adducts.add("?")  # Always allow '?' adducts
+
+     for i, feature_row in enumerate(sample_features.iter_rows(named=True)):
+         # Generate unique consensus ID
+         consensus_id_str = str(uuid.uuid4()).replace("-", "")[:16]
+
+         # Handle adduct information
+         adduct = feature_row.get("adduct")
+         if adduct is None or adduct not in valid_adducts:
+             # Set default adduct based on study polarity
+             study_polarity = getattr(study, "polarity", "positive")
+             if study_polarity in ["negative", "neg"]:
+                 adduct = "[M-?]1-"
+                 adduct_charge = -1
+                 adduct_mass_shift = -1.007825
+             else:
+                 adduct = "[M+?]1+"
+                 adduct_charge = 1
+                 adduct_mass_shift = 1.007825
+         else:
+             # Try to get charge and mass shift from cached adducts
+             adduct_charge = 1
+             adduct_mass_shift = 1.007825
+             if cached_adducts_df is not None and not cached_adducts_df.is_empty():
+                 matching_adduct = cached_adducts_df.filter(pl.col("name") == adduct)
+                 if not matching_adduct.is_empty():
+                     adduct_row = matching_adduct.row(0, named=True)
+                     adduct_charge = adduct_row["charge"]
+                     adduct_mass_shift = adduct_row["mass_shift"]
+
+         # Calculate neutral mass
+         mz = feature_row.get("mz", 0.0)
+         if adduct_charge and adduct_mass_shift is not None:
+             adduct_mass_neutral = mz * abs(adduct_charge) - adduct_mass_shift
+         else:
+             adduct_mass_neutral = None
+
+         # Count MS2 scans
+         ms2_scans = feature_row.get("ms2_scans", [])
+         ms2_count = len(ms2_scans) if ms2_scans else 0
+
+         # Create consensus feature metadata
+         consensus_feature = {
+             "consensus_uid": i,
+             "consensus_id": consensus_id_str,
+             "quality": feature_row.get("quality", 1.0),
+             "number_samples": 1,  # Always 1 for single sample
+             "rt": feature_row.get("rt", 0.0),
+             "mz": mz,
+             "rt_min": feature_row.get("rt", 0.0),
+             "rt_max": feature_row.get("rt", 0.0),
+             "rt_mean": feature_row.get("rt", 0.0),
+             "rt_start_mean": feature_row.get("rt_start", 0.0),
+             "rt_end_mean": feature_row.get("rt_end", 0.0),
+             "rt_delta_mean": feature_row.get("rt_delta", 0.0),
+             "mz_min": mz,
+             "mz_max": mz,
+             "mz_mean": mz,
+             "mz_start_mean": feature_row.get("mz_start", 0.0),
+             "mz_end_mean": feature_row.get("mz_end", 0.0),
+             "inty_mean": feature_row.get("inty", 0.0),
+             "bl": -1.0,
+             "chrom_coherence_mean": feature_row.get("chrom_coherence", 0.0),
+             "chrom_prominence_mean": feature_row.get("chrom_prominence", 0.0),
+             "chrom_prominence_scaled_mean": feature_row.get("chrom_prominence_scaled", 0.0),
+             "chrom_height_scaled_mean": feature_row.get("chrom_height_scaled", 0.0),
+             "iso": None,  # Will be filled by find_iso() function
+             "iso_mean": feature_row.get("iso", 0.0),
+             "charge_mean": feature_row.get("charge", 0.0),
+             "number_ms2": ms2_count,
+             "adducts": [[adduct, 1, 100.0]],  # Single adduct with 100% frequency
+             "adduct_top": adduct,
+             "adduct_charge_top": adduct_charge,
+             "adduct_mass_neutral_top": adduct_mass_neutral,
+             "adduct_mass_shift_top": adduct_mass_shift,
+             "id_top_name": None,
+             "id_top_class": None,
+             "id_top_adduct": None,
+             "id_top_score": None,
+             "id_source": None,
+         }
+
+         consensus_list.append(consensus_feature)
+
+         # Create mapping entry
+         mapping_entry = {
+             "consensus_uid": i,
+             "sample_uid": sample_uid,
+             "feature_uid": feature_row.get("feature_uid"),
+         }
+         mapping_list.append(mapping_entry)
+
+     # Create DataFrames
+     study.consensus_df = pl.DataFrame(consensus_list, strict=False)
+     study.consensus_mapping_df = pl.DataFrame(mapping_list, strict=False)
+
+     study.logger.info(f"Created {len(consensus_list)} consensus features from single sample")
+
+
  def _fast_correlation(x, y):
      """
      Fast correlation coefficient calculation for consensus matrix data.
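The neutral-mass step in the new helper is plain arithmetic, `M = mz * |z| - mass_shift`. A worked example using the function's default proton shift (the m/z value is hypothetical):

```python
mz = 181.070665               # hypothetical [M+H]1+ ion
adduct_charge = 1
adduct_mass_shift = 1.007825  # default shift used in the helper

# Same formula as in _handle_single_sample_merge
adduct_mass_neutral = mz * abs(adduct_charge) - adduct_mass_shift
print(round(adduct_mass_neutral, 6))  # 180.06284
```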
masster/study/plot.py CHANGED
@@ -2955,6 +2955,203 @@ def plot_tic(
      return p


+ def plot_heatmap(
+     self,
+     filename=None,
+     width=800,
+     height=600,
+     cmap="viridis",
+     title="Consensus Matrix Heatmap",
+     quant="chrom_area",
+     samples=None,
+ ):
+     """
+     Plot a heatmap of the consensus matrix data.
+
+     Samples are ordered from left to right, features are ordered by m/z from top to bottom.
+     Values are log10 transformed for better visualization.
+
+     Parameters:
+         filename (str, optional): Path to save the plot
+         width (int): Plot width in pixels (default: 800)
+         height (int): Plot height in pixels (default: 600)
+         cmap (str): Colormap name (default: "viridis")
+         title (str): Plot title (default: "Consensus Matrix Heatmap")
+         quant (str): Quantification method column name (default: "chrom_area")
+         samples: Sample identifier(s) to include. Can be:
+             - None: include all samples (default)
+             - int: single sample_uid
+             - str: single sample_name
+             - list: multiple sample_uids or sample_names
+     """
+     from bokeh.plotting import figure
+     from bokeh.models import LinearColorMapper, ColorBar, BasicTicker
+     from bokeh.transform import transform
+     import numpy as np
+     import pandas as pd
+
+     # Get consensus matrix
+     matrix_df = self.get_consensus_matrix(quant=quant, samples=samples)
+
+     if matrix_df is None or matrix_df.is_empty():
+         self.logger.error("No consensus matrix available for heatmap.")
+         return
+
+     # Get m/z values for each consensus_uid to sort by
+     if self.consensus_df is None or self.consensus_df.is_empty():
+         self.logger.error("No consensus_df available for sorting features by m/z.")
+         return
+
+     # Join with consensus_df to get m/z values
+     matrix_with_mz = matrix_df.join(
+         self.consensus_df.select(["consensus_uid", "mz"]),
+         on="consensus_uid",
+         how="left",
+     )
+
+     # Sort by m/z (ascending - lowest m/z at top)
+     matrix_with_mz = matrix_with_mz.sort("mz")
+
+     # Remove the m/z column after sorting
+     matrix_sorted = matrix_with_mz.drop("mz")
+
+     # Extract consensus_uid and sample columns
+     consensus_uids = matrix_sorted["consensus_uid"].to_list()
+     sample_cols = [col for col in matrix_sorted.columns if col != "consensus_uid"]
+
+     # Convert to pandas for easier heatmap processing
+     matrix_pd = matrix_sorted.select(sample_cols).to_pandas()
+
+     # Apply log10 transformation (add 1 to avoid log(0))
+     matrix_log = np.log10(matrix_pd.values + 1)
+
+     # Prepare data for Bokeh heatmap
+     # Create a list of (sample, feature, value) tuples
+     heatmap_data = []
+     for i, feature_idx in enumerate(range(len(consensus_uids))):
+         for j, sample in enumerate(sample_cols):
+             value = matrix_log[feature_idx, j]
+             heatmap_data.append({
+                 "sample": sample,
+                 "feature": str(consensus_uids[feature_idx]),
+                 "feature_idx": str(i),  # Use string index for y-axis position
+                 "value": value,
+             })
+
+     # Convert to DataFrame for Bokeh ColumnDataSource
+     heatmap_df = pd.DataFrame(heatmap_data)
+
+     from bokeh.models import ColumnDataSource
+
+     source = ColumnDataSource(heatmap_df)
+
+     # Handle colormap using cmap.Colormap
+     try:
+         # Get colormap palette using cmap
+         if isinstance(cmap, str):
+             colormap = Colormap(cmap)
+             # Generate 256 colors and convert to hex
+             import matplotlib.colors as mcolors
+
+             colors = colormap(np.linspace(0, 1, 256))
+             palette = [mcolors.rgb2hex(color) for color in colors]
+         else:
+             colormap = cmap
+             # Try to use to_bokeh() method first
+             try:
+                 palette = colormap.to_bokeh()
+                 # Ensure we got a color palette, not another mapper
+                 if not isinstance(palette, (list, tuple)):
+                     # Fall back to generating colors manually
+                     import matplotlib.colors as mcolors
+
+                     colors = colormap(np.linspace(0, 1, 256))
+                     palette = [mcolors.rgb2hex(color) for color in colors]
+             except AttributeError:
+                 # Fall back to generating colors manually
+                 import matplotlib.colors as mcolors
+
+                 colors = colormap(np.linspace(0, 1, 256))
+                 palette = [mcolors.rgb2hex(color) for color in colors]
+     except (AttributeError, ValueError, TypeError) as e:
+         # Fallback to viridis if cmap interpretation fails
+         self.logger.warning(f"Could not interpret colormap '{cmap}': {e}, falling back to viridis")
+         from bokeh.palettes import viridis
+
+         palette = viridis(256)
+
+     # Create color mapper
+     color_mapper = LinearColorMapper(
+         palette=palette,
+         low=heatmap_df["value"].min(),
+         high=heatmap_df["value"].max(),
+     )
+
+     # Create figure with categorical ranges for both axes
+     p = figure(
+         width=width,
+         height=height,
+         title=title,
+         x_range=sample_cols,
+         y_range=[str(i) for i in range(len(consensus_uids))],
+         toolbar_location="above",
+         tools="pan,wheel_zoom,box_zoom,reset,save,hover",
+         tooltips=[
+             ("Sample", "@sample"),
+             ("Feature UID", "@feature"),
+             ("log10(Value+1)", "@value{0.00}"),
+         ],
+     )
+
+     # Draw rectangles for heatmap
+     p.rect(
+         x="sample",
+         y="feature_idx",
+         width=1,
+         height=1,
+         source=source,
+         fill_color=transform("value", color_mapper),
+         line_color=None,
+     )
+
+     # Add colorbar
+     color_bar = ColorBar(
+         color_mapper=color_mapper,
+         width=8,
+         location=(0, 0),
+         title=f"log10({quant}+1)",
+         ticker=BasicTicker(desired_num_ticks=8),
+     )
+     p.add_layout(color_bar, "right")
+
+     # Style the plot
+     p.axis.axis_line_color = None
+     p.axis.major_tick_line_color = None
+     p.grid.grid_line_color = None
+     p.xaxis.major_label_orientation = 45
+     p.yaxis.axis_label = "Features (sorted by m/z)"
+     p.xaxis.axis_label = "Samples"
+
+     # Apply consistent save/display behavior
+     if filename is not None:
+         # Convert relative paths to absolute paths using study folder as base
+         import os
+
+         if not os.path.isabs(filename):
+             filename = os.path.join(self.folder, filename)
+
+         # Convert to absolute path for logging
+         abs_filename = os.path.abspath(filename)
+
+         # Use isolated file saving
+         _isolated_save_plot(p, filename, abs_filename, self.logger, "Heatmap Plot")
+     else:
+         # Show in notebook when no filename provided
+         _isolated_show_notebook(p)
+
+     return p
+
+
  def plot_pca(self, *args, **kwargs):
      """Deprecated: Use plot_samples_pca instead."""
      import warnings
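A hedged usage sketch for the new method; argument values come from the docstring defaults above, and the sample names are illustrative:

```python
# Inline display (no filename): returns the Bokeh figure
p = study.plot_heatmap(quant="chrom_area", cmap="viridis")

# Subset of samples, saved under the study folder
# (relative filenames are resolved against study.folder, per the code above)
study.plot_heatmap(
    samples=["QC_01", "QC_02"],   # hypothetical sample_names
    title="QC consensus heatmap",
    filename="plots/qc_heatmap.html",
)
```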
masster/study/study.py CHANGED
@@ -14,7 +14,7 @@ Main class:
      consensus_select/filter/delete
  - Retrieval: get_consensus, get_chrom, get_samples, get_*_stats, get_*_matrix
  - Plotting: plot_alignment, plot_samples_pca/umap/2d, plot_tic/bpc/eic, plot_chrom,
-     plot_rt_correction, plot_consensus_2d/stats
+     plot_rt_correction, plot_consensus_2d/stats, plot_heatmap
  - Export: export_mgf, export_mztab, export_xlsx, export_parquet
  - Identification: lib_load, identify, get_id, id_reset, lib_reset
  - Parameters: get/update parameters, update_history
@@ -96,6 +96,7 @@ from masster.study.plot import plot_bpc
  from masster.study.plot import plot_tic
  from masster.study.plot import plot_eic
  from masster.study.plot import plot_rt_correction
+ from masster.study.plot import plot_heatmap
  from masster.study.processing import align
  from masster.study.merge import merge
  from masster.study.processing import integrate
@@ -429,6 +430,7 @@ class Study:
      plot_rt_correction = plot_rt_correction
      plot_tic = plot_tic
      plot_eic = plot_eic
+     plot_heatmap = plot_heatmap

      # === Analysis Operations ===
      analyze_umap = analyze_umap
@@ -261,6 +261,21 @@
      },
      "ms1_spec": {
          "dtype": "pl.Object"
+     },
+     "id_top_name": {
+         "dtype": "pl.Utf8"
+     },
+     "id_top_class": {
+         "dtype": "pl.Utf8"
+     },
+     "id_top_adduct": {
+         "dtype": "pl.Utf8"
+     },
+     "id_top_score": {
+         "dtype": "pl.Float64"
+     },
+     "id_source": {
+         "dtype": "pl.Utf8"
      }
  }
},
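The five new identification columns declare Polars dtypes as strings. A minimal sketch of what they resolve to (the dict below is illustrative, not the package's schema loader):

```python
import polars as pl

# Dtype strings from the schema hunk above, resolved to Polars types
ID_COLUMNS = {
    "id_top_name": pl.Utf8,
    "id_top_class": pl.Utf8,
    "id_top_adduct": pl.Utf8,
    "id_top_score": pl.Float64,
    "id_source": pl.Utf8,
}

# An empty frame carrying just the new consensus_df columns
empty = pl.DataFrame(schema=ID_COLUMNS)
print(empty.schema)
```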
masster/wizard/wizard.py CHANGED
@@ -200,12 +200,12 @@ class wizard_def:
      # Set default adducts based on polarity if not provided
      if not self.adducts:
          if self.polarity and self.polarity.lower() in ["positive", "pos"]:
-             self.adducts = ["H:+:0.8", "Na:+:0.1", "NH4:+:0.1"]
+             self.adducts = ["+H:1:0.8", "+Na:1:0.1", "+NH4:1:0.1"]
          elif self.polarity and self.polarity.lower() in ["negative", "neg"]:
-             self.adducts = ["H-1:-:1.0", "CH2O2:0:0.5"]
+             self.adducts = ["-H:-1:1.0", "+CH2O2:0:0.5"]
          else:
              # Default to positive if polarity is None or unknown
-             self.adducts = ["H:+:0.8", "Na:+:0.1", "NH4:+:0.1"]
+             self.adducts = ["+H:1:0.8", "+Na:1:0.1", "+NH4:1:0.1"]

      # Validate num_cores
      max_cores = multiprocessing.cpu_count()
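The default adduct specs switch from a sign-based to a signed-integer-charge format. Reading the triplets as `<adduct>:<charge>:<weight>` is an inference from the values, not something documented in this hunk; a hedged parsing sketch:

```python
# Hedged reading of the new spec strings: "<adduct>:<charge>:<weight>"
# (interpretation inferred from the values; parse_adduct_spec is illustrative)
def parse_adduct_spec(spec: str) -> tuple[str, int, float]:
    name, charge, weight = spec.rsplit(":", 2)
    return name, int(charge), float(weight)

for spec in ["+H:1:0.8", "+Na:1:0.1", "-H:-1:1.0", "+CH2O2:0:0.5"]:
    print(parse_adduct_spec(spec))
# ('+H', 1, 0.8)  ('+Na', 1, 0.1)  ('-H', -1, 1.0)  ('+CH2O2', 0, 0.5)
```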
@@ -676,9 +676,7 @@ class Wizard:
      " ",
      "    # Step 3: Create and configure study",
      '    print("\\nStep 3/7: Initializing study...")',
-     "    study = Study(folder=PARAMS['folder'])",
-     "    study.polarity = PARAMS['polarity']",
-     "    study.adducts = PARAMS['adducts']",
+     "    study = Study(folder=PARAMS['folder'], polarity=PARAMS['polarity'], adducts=PARAMS['adducts'])",
      " ",
      "    # Step 4: Add sample5 files to study",
      '    print("\\nStep 4/7: Adding samples to study...")',
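The generated script now configures the study entirely through the constructor instead of mutating the object afterwards. Side by side, with parameter names exactly as in the hunk (the folder value is illustrative):

```python
from masster import Study

# Before: construct, then mutate attributes
study = Study(folder="out")
study.polarity = "positive"
study.adducts = ["+H:1:0.8", "+Na:1:0.1", "+NH4:1:0.1"]

# After: one call, matching the rewritten generated line
study = Study(
    folder="out",
    polarity="positive",
    adducts=["+H:1:0.8", "+Na:1:0.1", "+NH4:1:0.1"],
)
```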
@@ -692,6 +690,12 @@ class Wizard:
      "        rt_tol=PARAMS['rt_tol']",
      "    )",
      " ",
+     "    # Check that more than 1 file has been loaded",
+     "    if len(study.samples) <= 1:",
+     '        print("\\nWARNING: Study merging requires more than 1 sample file.")',
+     '        print(f"Only {len(study.samples)} sample(s) loaded. Terminating execution.")',
+     "        return False",
+     " ",
      "    study.merge(",
      '        method="qt",',
      "        min_samples=PARAMS['min_samples_per_feature'],",
@@ -764,14 +768,9 @@ class Wizard:
      'app = marimo.App(width="medium")',
      "",
      "@app.cell",
-     "def __():",
-     "    import marimo as mo",
-     "    return (mo,)",
-     "",
-     "@app.cell",
      "def __(mo):",
      '    mo.md(r"""',
-     "    # MASSter Interactive Analysis",
+     "    ## MASSter Interactive Analysis",
      "    ",
      f"    **Source:** {source_info.get('number_of_files', 0)} files detected",
      f"    **Polarity:** {source_info.get('polarity', 'unknown')}",
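marimo allows each global name to be defined by exactly one cell, so the removed cell (a second `def __()` returning `mo`) would clash with an existing import cell in the generated notebook. A minimal sketch of the corrected skeleton (markdown content abbreviated; assumes the standard marimo file layout):

```python
import marimo

app = marimo.App(width="medium")

@app.cell
def __():
    # Single definition of `mo`; a duplicate cell defining it again
    # would raise a multiple-definition error when the notebook runs
    import marimo as mo
    return (mo,)

@app.cell
def __(mo):
    mo.md(r"""## MASSter Interactive Analysis""")
    return

if __name__ == "__main__":
    app.run()
```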
masster-0.5.28.dist-info/METADATA → masster-0.6.1.dist-info/METADATA CHANGED
@@ -1,12 +1,12 @@
  Metadata-Version: 2.4
  Name: masster
- Version: 0.5.28
+ Version: 0.6.1
  Summary: Mass spectrometry data analysis package
  Project-URL: homepage, https://github.com/zamboni-lab/masster
  Project-URL: repository, https://github.com/zamboni-lab/masster
  Project-URL: documentation, https://github.com/zamboni-lab/masster#readme
  Project-URL: Third-Party Licenses, https://github.com/zamboni-lab/masster/blob/main/THIRD_PARTY_NOTICES.md
- Author: Zamboni Lab
+ Author: Zamboni Lab, ETH Zurich
  License: GNU AFFERO GENERAL PUBLIC LICENSE
          Version 3, 19 November 2007
@@ -734,19 +734,19 @@ Description-Content-Type: text/markdown
  ## Background and motivation

- MASSter is actively used, maintainted, and developed by the Zamboni Lab at ETH Zurich. The project started because many needs of were unmatched by the "usual" software packages (mzmine, msdial, W4M, ...), e.g. performance, scalability, sensitivity, robustness, speed, rapid implementation of new features, embedding in ETL systems, and so on.
+ MASSter is actively used, maintained, and developed by the Zamboni Lab at ETH Zurich. The project started because many needs were unmet by the "usual" software packages (mzMine, MS-DIAL, Workflow4Metabolomics (W4M), ...), for example performance, scalability, sensitivity, robustness, speed, rapid implementation of new features, and embedding in ETL systems.

- All methods include a long list of parameters, and might wrap alternative algorithms. These are only relevant for advanced users. We recommend running the processing methods with defaults, or using the Wizard.
+ All methods include many parameters and may wrap alternative algorithms. These options are primarily relevant for advanced users. We recommend running the processing methods with the defaults or using the Wizard.

  ## Content

  MASSter is designed to deal with DDA data, and hides functionalities for DIA and ZTScan DIA data. The sample-centric feature detection uses OpenMS, which is both accurate and fast, and it was wrapped with additional code to improve isotope and adduct detection. All other functionalities are own implementations: centroiding, RT alignment, adduct and isotopomer detection, merging of multiple samples, gap-filling, quantification, etc.

- MASSter was engineered to maximize quality of results, sensitivity, scalability, and also speed. Yes, it's Python which is notoriously slower than other languages, but considerable time was spent in speeding up everything, including the systematic use of [polars](https://pola.rs/), numpy vectorization, multiprocessing, chunking, etc. MASSter was tested with studies with 3000+ LC-MS/MS samples (1 Mio MS2 spectra), and it autonomously completed analysis within a few hours.
+ MASSter was engineered to maximize result quality, sensitivity, scalability, and speed. Yes, it's Python, which can be slower than other languages, but considerable effort was spent on optimizations, including the systematic use of [Polars](https://pola.rs/), NumPy vectorization, multiprocessing, and chunking. MASSter has been tested on studies with 3,000+ LCMS/MS samples (1 million MS2 spectra) and autonomously completed analyses within a few hours.

  ## Architecture

- MASSter defines own classes for Spectra, Chromatograms, Libraries, Samples, and Studies (= bunch of samples, i.e. a LC-MS sequence). Users will deal mostly with one Study() object at the time. Sample() objects are created when analyzing a batch - and saved for caching -, or will be used only for development, troubleshooting, or to generate illustrations.
+ MASSter defines classes for Spectra, Chromatograms, Libraries, Samples, and Studies (a Study is a collection of samples, i.e. an LCMS sequence). Users will typically work with a single `Study` object at a time. `Sample` objects are created when analyzing a batch (and saved for caching), or used for development, troubleshooting, or generating illustrations.

  The analysis can be done in scripts (without user intervention, e.g. by the integrated Wizard), or interactively in notebooks, i.e. [marimo](https://marimo.io/) or [jupyter](https://jupyter.org/).
@@ -756,9 +756,9 @@ You'll need to install Python (3.10-3.13, 3.14 has not been tested yet).
  MASSter reads raw (Thermo), wiff (SCIEX), or mzML data. Reading vendor formats relies on .NET libraries, and is only possible in Windows. On Linux or MacOS, you'll be forced to use mzML data.

- **It's recommended to use data in either vendor's raw format (wiff and raw) or mzML in profile data.** MASSter includes a sophisticated and sufficiently fast centroiding algorithm that works well across the full dynamic range and will only act on the spectra that are relevant. In our tests with data from different vendors, the centroiding performed much better than most Vendor's implementations (that are primarily proteomics-centric).
+ **It's recommended to use data in either the vendor's raw formats (WIFF and Thermo RAW) or mzML in profile mode.** MASSter includes a sophisticated and sufficiently fast centroiding algorithm that works well across the full dynamic range and will only act on spectra that are relevant. In our tests with data from different vendors, the centroiding performed much better than most vendor implementations (which are primarily proteomics-centric).

- If still want to convert raw data to centroided mzML, please use (CentroidR)[https://github.com/Adafede/CentroidR/tree/0.0.0.9001].
+ If you still want to convert raw data to centroided mzML, please use CentroidR: https://github.com/Adafede/CentroidR/tree/0.0.0.9001

  ## Installation
@@ -769,7 +769,7 @@ pip install masster
  ## Getting started
  **The quickest way to use, or learn how to use MASSter, is to use the Wizard** which we integrated and, ideally, takes care of everything automatically.

- The Wizard only needs to know where to find the MS files and were the store the results.
+ The Wizard only needs to know where to find the MS files and where to store the results.
  ```python
  from masster import Wizard
  wiz = Wizard(
@@ -780,15 +780,15 @@ wiz = Wizard(
  wiz.test_and_run()
  ```

- This will trigger the analysis of raw data, and the creation of a script to process all samples and then assemble the study. The whole processing will be stored as `1_masster_workflow.py` in the output folder. The wizard will test once and, if successull, run the full workflow using parallel processes. Once the processing is over you, navigate to `folder` to see what happened...
+ This will trigger the analysis of raw data, and the creation of a script to process all samples and then assemble the study. The whole processing will be stored as `1_masster_workflow.py` in the output folder. The wizard will test once and, if successful, run the full workflow using parallel processes. Once the processing is over you, navigate to `folder` to see what happened...

  If you want to interact with your data, we recommend using [marimo](https://marimo.io/) or [jupyter](https://jupyter.org/) and open the `*.study5` file, for example:

  ```bash
- # use marimo to open the script created by marino
- marimo edit '..\..folder_to_store_results\2_interactive_analysis.py'
- # or, if you use uv to manage an environment with masster
- uv run marimo edit '..\..folder_to_store_results\2_interactive_analysis.py'
+ # use marimo to open the script created by marimo
+ marimo edit '..\\..\\folder_to_store_results\\2_interactive_analysis.py'
+ # or, if you use uv to manage an environment with masster
+ uv run marimo edit '..\\..\\folder_to_store_results\\2_interactive_analysis.py'
  ```

  ### Basic Workflow for analyzing LC-MS study with 1-1000+ samples
@@ -833,6 +833,7 @@ study.save()
  study.plot_samples_pca()
  study.plot_samples_umap()
  study.plot_samples_2d()
+ study.plot_heatmap()

  # To know more about the available methods...
  dir(study)
@@ -874,7 +875,7 @@ sample.plot_2d()
  sample.plot_features_stats()

  # explore methods
- dir(study)
+ dir(sample)
  ```

  ## Disclaimer
@@ -885,11 +886,9 @@ dir(study)
  - **Backward compatibility**: We do not guarantee backward compatibility between versions. Breaking changes may occur as we improve the software
  - **Performance**: While optimized for our workflows, performance may vary depending on your data and system configuration
  - **Results**: We do our best to ensure accuracy, but you should validate results independently for your research
- - **Support**: This is an academic project with limited resources. Community support is available through GitHub issues, but we cannot guarantee response times
+ - **Support**: This is an academic project with limited resources. At the moment, we do not provide external user support.
  - **Production use**: If you plan to use MASSter in production or critical workflows, thorough testing with your data is recommended

- We welcome feedback, bug reports, and contributions via GitHub!
-
  ## License
  GNU Affero General Public License v3