PyPI - masster - Versions diffs - 0.5.17__py3-none-any.whl → 0.5.19__py3-none-any.whl - Mend

masster 0.5.17__py3-none-any.whl → 0.5.19__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of masster might be problematic. Click here for more details.

Files changed (21) hide show

masster/_version.py +1 -1
masster/sample/adducts.py +12 -0
masster/sample/defaults/find_ms2_def.py +5 -5
masster/sample/defaults/sample_def.py +30 -6
masster/sample/h5.py +59 -13
masster/sample/lib.py +9 -3
masster/sample/load.py +47 -120
masster/sample/processing.py +3 -3
masster/sample/sample.py +5 -3
masster/sample/sciex.py +62 -648
masster/sample/thermo.py +801 -0
masster/study/id.py +3 -1
masster/study/load.py +15 -792
masster/study/study.py +1 -0
masster/wizard/README.md +15 -15
masster/wizard/wizard.py +82 -28
{masster-0.5.17.dist-info → masster-0.5.19.dist-info}/METADATA +3 -2
{masster-0.5.17.dist-info → masster-0.5.19.dist-info}/RECORD +21 -20
{masster-0.5.17.dist-info → masster-0.5.19.dist-info}/WHEEL +0 -0
{masster-0.5.17.dist-info → masster-0.5.19.dist-info}/entry_points.txt +0 -0
{masster-0.5.17.dist-info → masster-0.5.19.dist-info}/licenses/LICENSE +0 -0

masster/_version.py CHANGED Viewed

@@ -1,7 +1,7 @@
 from __future__ import annotations
-__version__ = "0.5.17"
+__version__ = "0.5.19"
 def get_version():

masster/sample/adducts.py CHANGED Viewed

@@ -403,6 +403,7 @@ def find_adducts(self, **kwargs):
     Main parameters (from ``find_adducts_defaults``):
     - adducts (list[str] | str | None): List of potential adduct strings or ionization mode ('pos'/'neg').
+      If None, automatically uses sample.polarity to select appropriate default adducts.
     - charge_min (int): Minimum allowed charge state (default: -4).
     - charge_max (int): Maximum allowed charge state (default: 4).
     - retention_max_diff (float): Maximum RT difference in seconds (default: 1.0).
@@ -431,6 +432,17 @@ def find_adducts(self, **kwargs):
             else:
                 self.logger.warning(f"Unknown parameter {key} ignored")
+    # Auto-set adducts based on sample polarity if not explicitly provided
+    if params.adducts is None and hasattr(self, 'polarity') and self.polarity is not None:
+        if self.polarity.lower() in ['positive', 'pos']:
+            params.set('adducts', 'positive', validate=True)
+            self.logger.debug(f"Auto-set adducts to 'positive' based on sample polarity: {self.polarity}")
+        elif self.polarity.lower() in ['negative', 'neg']:
+            params.set('adducts', 'negative', validate=True)
+            self.logger.debug(f"Auto-set adducts to 'negative' based on sample polarity: {self.polarity}")
+        else:
+            self.logger.debug(f"Unknown sample polarity '{self.polarity}', using default adducts")
     # Check if features_df exists and has data
     if not hasattr(self, "features_df") or len(self.features_df) == 0:
         self.logger.warning(

masster/sample/defaults/find_ms2_def.py CHANGED Viewed

@@ -42,7 +42,7 @@ class find_ms2_defaults:
         - get_description(param_name): Get parameter description
         - get_info(param_name): Get full parameter metadata
         - list_parameters(): Get list of all parameter names
-        - get_mz_tolerance(file_type): Get appropriate m/z tolerance based on file type
+        - get_mz_tolerance(type): Get appropriate m/z tolerance based on type
     """
     # Core MS2 linking parameters
@@ -270,16 +270,16 @@ class find_ms2_defaults:
         return len(invalid_params) == 0, invalid_params
-    def get_mz_tolerance(self, file_type=None):
+    def get_mz_tolerance(self, type=None):
         """
-        Get the appropriate m/z tolerance based on file type.
+        Get the appropriate m/z tolerance based on type.
         Args:
-            file_type (str, optional): File type ('ztscan', 'dia', or other)
+            type (str, optional): Acquisition type ('ztscan', 'dia', or other)
         Returns:
             float: Appropriate m/z tolerance value
         """
-        if file_type is not None and file_type.lower() in ["ztscan", "dia"]:
+        if type is not None and type.lower() in ["ztscan", "dia"]:
             return self.get("mz_tol_ztscan")
         return self.get("mz_tol")

masster/sample/defaults/sample_def.py CHANGED Viewed

@@ -32,30 +32,42 @@ class sample_defaults:
         centroid_prominence (int): Prominence parameter for centroiding. Default is -1.
         max_points_per_spectrum (int): Maximum number of points per spectrum. Default is 50000.
         dia_window (Optional[float]): DIA window size. Default is None.
+        type (str): Acquisition type/mode. Options are 'dda', 'swath', 'ztscan', 'fia'. Default is 'dda'.
+        polarity (Optional[str]): Ionization polarity. Options are None, 'positive', 'negative'. Default is None.
     """
     filename: Optional[str] = None
-    ondisk: bool = False
     label: str | None = None
     log_level: str = "INFO"
     log_label: Optional[str] = ""
     log_sink: str = "sys.stdout"
-    chrom_fwhm: float = 1.0
+    ondisk: bool = False
+    # file and data handling settings
+    type: str = "dda"
+    polarity: str | None = None
+    # chromatographic settings
+    #chrom_fwhm: float = 1.0
+    eic_mz_tol: float = 0.01
+    eic_rt_tol: float = 10.0
+    # mz tolerances
     mz_tol_ms1_da: float = 0.002
     mz_tol_ms2_da: float = 0.005
     mz_tol_ms1_ppm: float = 5.0
     mz_tol_ms2_ppm: float = 10.0
+    # centroiding settings
     centroid_algo: str = "lmp"
     centroid_min_points_ms1: int = 5
     centroid_min_points_ms2: int = 4
     centroid_smooth: int = 5
     centroid_refine: bool = True
     centroid_prominence: int = -1
+    # data retrieval settings
     max_points_per_spectrum: int = 50000
-    dia_window: float | None = None
-    eic_mz_tol: float = 0.01
-    eic_rt_tol: float = 10.0
     _param_metadata: dict[str, dict[str, Any]] = field(
         default_factory=lambda: {
@@ -178,6 +190,18 @@ class sample_defaults:
                 "min_value": 0.2,
                 "max_value": 60.0,
             },
+            "type": {
+                "dtype": str,
+                "description": "Acquisition type/mode",
+                "default": "dda",
+                "allowed_values": ["dda", "swath", "ztscan", "fia"],
+            },
+            "polarity": {
+                "dtype": "Optional[str]",
+                "description": "Ionization polarity",
+                "default": None,
+                "allowed_values": ["positive", "negative"],
+            },
         },
         repr=False,
     )

masster/sample/h5.py CHANGED Viewed

@@ -1,4 +1,4 @@
-import json
+import json
 import os
 import h5py
@@ -94,8 +94,8 @@ def _save_sample5(
             metadata_group.attrs["file_source"] = str(self.file_source)
         else:
             metadata_group.attrs["file_source"] = ""
-        if self.file_type is not None:
-            metadata_group.attrs["file_type"] = str(self.file_type)
+        if hasattr(self, 'type') and self.type is not None:
+            metadata_group.attrs["file_type"] = str(self.type)
         else:
             metadata_group.attrs["file_type"] = ""
         if self.label is not None:
@@ -287,11 +287,41 @@ def _save_sample5(
                     compression="gzip",
                 )
-        # Store parameters as JSON
-        if self.parameters is not None:
-            # Convert parameters dict to JSON string
-            params_json = json.dumps(self.parameters, default=str)
-            metadata_group.attrs["parameters"] = params_json
+        # Store parameters/history as JSON
+        # Always ensure we sync instance attributes to parameters before saving
+        if hasattr(self, 'parameters') and self.parameters is not None:
+            if hasattr(self, 'polarity') and self.polarity is not None:
+                self.parameters.polarity = self.polarity
+            if hasattr(self, 'type') and self.type is not None:
+                self.parameters.type = self.type
+        # Prepare save data
+        save_data = {}
+        # Add parameters as a dictionary
+        if hasattr(self, 'parameters') and self.parameters is not None:
+            save_data["sample"] = self.parameters.to_dict()
+        # Add history data (but ensure it's JSON serializable)
+        if hasattr(self, 'history') and self.history is not None:
+            # Convert any non-JSON-serializable objects to strings/dicts
+            serializable_history = {}
+            for key, value in self.history.items():
+                if key == "sample":
+                    # Use our properly serialized parameters
+                    continue  # Skip, we'll add it from parameters above
+                try:
+                    # Test if value is JSON serializable
+                    json.dumps(value)
+                    serializable_history[key] = value
+                except (TypeError, ValueError):
+                    # Convert to string if not serializable
+                    serializable_history[key] = str(value)
+            save_data.update(serializable_history)
+        # Save as JSON
+        params_json = json.dumps(save_data, indent=2)
+        metadata_group.attrs["parameters"] = params_json
         # Store lib and lib_match - removed (no longer saving lib data)
@@ -363,7 +393,7 @@ def _load_sample5(self, filename: str, map: bool = False):
             else:
                 self.file_source = self.file_path
-            self.file_type = decode_metadata_attr(
+            self.type = decode_metadata_attr(
                 metadata_group.attrs.get("file_type", ""),
             )
             self.label = decode_metadata_attr(metadata_group.attrs.get("label", ""))
@@ -1072,6 +1102,14 @@ def _load_sample5(self, filename: str, map: bool = False):
     # set self.label to basename without extension
     if self.label is None or self.label == "":
         self.label = os.path.splitext(os.path.basename(filename))[0]
+    # Sync instance attributes from loaded parameters
+    if hasattr(self, 'parameters') and self.parameters is not None:
+        if hasattr(self.parameters, 'polarity') and self.parameters.polarity is not None:
+            self.polarity = self.parameters.polarity
+        if hasattr(self.parameters, 'type') and self.parameters.type is not None:
+            self.type = self.parameters.type
     self.logger.info(f"Sample loaded from {filename}")
@@ -1122,7 +1160,7 @@ def _load_sample5_study(self, filename: str, map: bool = False):
             else:
                 self.file_source = self.file_path
-            self.file_type = decode_metadata_attr(
+            self.type = decode_metadata_attr(
                 metadata_group.attrs.get("file_type", ""),
             )
             self.label = decode_metadata_attr(metadata_group.attrs.get("label", ""))
@@ -1810,6 +1848,14 @@ def _load_sample5_study(self, filename: str, map: bool = False):
     # set self.label to basename without extension
     if self.label is None or self.label == "":
         self.label = os.path.splitext(os.path.basename(filename))[0]
+    # Sync instance attributes from loaded parameters
+    if hasattr(self, 'parameters') and self.parameters is not None:
+        if hasattr(self.parameters, 'polarity') and self.parameters.polarity is not None:
+            self.polarity = self.parameters.polarity
+        if hasattr(self.parameters, 'type') and self.parameters.type is not None:
+            self.type = self.parameters.type
     self.logger.info(
         f"Sample loaded successfully from {filename} (optimized for study)",
     )
@@ -2256,7 +2302,7 @@ def create_h5_metadata_group(
     f: h5py.File,
     file_path: Optional[str],
     file_source: Optional[str],
-    file_type: Optional[str],
+    type: Optional[str],
     label: Optional[str],
 ) -> None:
     """
@@ -2266,7 +2312,7 @@ def create_h5_metadata_group(
         f: The HDF5 file object
         file_path: Source file path
         file_source: Original source file path
-        file_type: Source file type
+        type: Source file type
         label: Sample label
     """
     metadata_group = f.create_group("metadata")
@@ -2275,5 +2321,5 @@ def create_h5_metadata_group(
     metadata_group.attrs["file_source"] = (
         str(file_source) if file_source is not None else ""
     )
-    metadata_group.attrs["file_type"] = str(file_type) if file_type is not None else ""
+    metadata_group.attrs["file_type"] = str(type) if type is not None else ""
     metadata_group.attrs["label"] = str(label) if label is not None else ""

masster/sample/lib.py CHANGED Viewed

@@ -71,7 +71,7 @@ def load_lib(self, *args, **kwargs):
     lib_load(self, *args, **kwargs)
-def lib_load(self, csvfile=None, polarity="positive"):
+def lib_load(self, csvfile=None, polarity=None):
     delta_m = {
         "[M+H]+": 1.007276,
         "[M+Na]+": 22.989218,
@@ -97,10 +97,11 @@ def lib_load(self, csvfile=None, polarity="positive"):
     """
     Load target compounds from a CSV file.
     This method reads a CSV file containing target compounds and their properties, such as m/z, retention time (RT),
-    and adducts. It filters the targets based on the specified adducts and returns a DataFrame of the targets.
+    and adducts. It filters the targets based on the specified polarity and returns a DataFrame of the targets.
     Parameters:
         csvfile (str): The path to the CSV file containing target compounds.
-        adducts (list, optional): A list of adducts to filter the targets. Default is ['[M+H]+', '[M+Na]+', '[M+K]+'].
+        polarity (str, optional): Ion polarity to filter adducts ('positive' or 'negative').
+                                  If None, uses the sample's polarity property. Default is None.
     Returns:
         pd.DataFrame: A DataFrame containing the filtered target compounds with columns 'mz', 'rt', 'adduct'.
     """
@@ -220,6 +221,11 @@ def lib_load(self, csvfile=None, polarity="positive"):
     self.lib = self.lib.where(pd.notnull(self.lib), None)
     # find all elements == nan and replace them with None
     self.lib = self.lib.replace({np.nan: None})
+    # Use sample.polarity if polarity parameter is None
+    if polarity is None:
+        polarity = getattr(self, 'polarity', 'positive')
     if polarity is not None:
         if polarity.lower() == "positive":
             self.lib = self.lib[self.lib["z"] > 0]

masster/sample/load.py CHANGED Viewed

@@ -73,7 +73,7 @@ def load(
         filename (str): The path to the file to load. The file must exist and have one of the following extensions:
                         .mzML, .wiff, or .raw.
         ondisk (bool, optional): Indicates whether the file should be treated as on disk. Defaults to False.
-        type (str, optional): Specifies the type of file. If provided and set to 'ztscan' (case-insensitive), the file_type
+        type (str, optional): Specifies the type of file. If provided and set to 'ztscan' (case-insensitive), the type
                                 attribute will be adjusted accordingly. Defaults to None.
         label (Any, optional): An optional label to associate with the loaded file. Defaults to None.
     Raises:
@@ -84,7 +84,7 @@ def load(
             - ".mzml": Calls _load_mzML(filename)
             - ".wiff": Calls _load_wiff(filename)
             - ".raw": Calls _load_raw(filename)
-        After loading, the file_type attribute is set to 'dda', unless the optional 'type' parameter is provided as 'ztscan',
+        After loading, the type attribute is set to 'dda', unless the optional 'type' parameter is provided as 'ztscan',
         in which case it is updated to 'ztscan'. The label attribute is updated if a label is provided.
     """
@@ -109,9 +109,9 @@ def load(
     else:
         raise ValueError("File must be .mzML, .wiff, *.raw, or .sample5")
-    self.file_type = "dda"
+    self.type = "dda"
     if type is not None and type.lower() in ["ztscan"]:
-        self.file_type = "ztscan"
+        self.type = "ztscan"
     if label is not None:
         self.label = label
@@ -167,9 +167,9 @@ def load_noms1(
     else:
         raise ValueError("File must be .mzML, .wiff, *.raw, or .sample5")
-    self.file_type = "dda"
+    self.type = "dda"
     if type is not None and type.lower() in ["ztscan"]:
-        self.file_type = "ztscan"
+        self.type = "ztscan"
     if label is not None:
         self.label = label
@@ -255,6 +255,7 @@ def _load_mzML(
     )
     tdqm_disable = self.log_level not in ["TRACE", "DEBUG", "INFO"]
+    polarity = None
     # iterate over all spectra
     for i, s in tqdm(
         enumerate(omsexp.getSpectra()),  # type: ignore[union-attr]
@@ -262,23 +263,36 @@ def _load_mzML(
         desc=f"{datetime.now().strftime('%Y-%m-%d %H:%M:%S.%f')[:-3]} | INFO     | {self.log_label}Scans",
         disable=tdqm_disable,
     ):
+        # try to get polarity
+        if polarity is None:
+            try:
+                pol = s.getInstrumentSettings().getPolarity()
+                if pol == 1:
+                    polarity = "positive"
+                elif pol == 2:
+                    polarity = "negative"
+            except Exception:
+                pass
         # create a dict
         if s.getMSLevel() == 1:
             cycle += 1
             prec_mz = None
             precursorIsolationWindowLowerMZ = None
             precursorIsolationWindowUpperMZ = None
-            prec_intyensity = None
+            prec_inty = None
             energy = None
         else:
-            prec_mz = s.getPrecursors()[0].getMZ()
+            prec_mz = s.getPrecursors()
+            if len(prec_mz) == 0:
+                continue
+            prec_mz = prec_mz[0].getMZ()
             precursorIsolationWindowLowerMZ = s.getPrecursors()[
                 0
             ].getIsolationWindowLowerOffset()
             precursorIsolationWindowUpperMZ = s.getPrecursors()[
                 0
             ].getIsolationWindowUpperOffset()
-            prec_intyensity = s.getPrecursors()[0].getIntensity()
+            prec_inty = s.getPrecursors()[0].getIntensity()
             # Try to get collision energy from meta values first, fallback to getActivationEnergy()
             try:
                 energy = s.getPrecursors()[0].getMetaValue("collision energy")
@@ -321,7 +335,7 @@ def _load_mzML(
             "prec_mz": prec_mz,
             "prec_mz_min": precursorIsolationWindowLowerMZ,
             "prec_mz_max": precursorIsolationWindowUpperMZ,
-            "prec_inty": prec_intyensity,
+            "prec_inty": prec_inty,
             "energy": energy,
             "feature_uid": -1,
         }
@@ -367,10 +381,11 @@ def _load_mzML(
         },
         infer_schema_length=None,
     )
+    self.polarity = polarity
     self.file_interface = "oms"
     self.ms1_df = ms1_df
     self.label = os.path.basename(filename)
-    if self.file_type != "ztscan":
+    if self.type != "ztscan":
         self.analyze_dda()
@@ -401,7 +416,8 @@ def _load_raw(
         - Updates instance attributes including self.file_path, self.file_obj, self.file_interface, and self.label.
         - Initiates further analysis by invoking analyze_dda().
     """
-    from alpharaw.thermo import ThermoRawData
+    #from alpharaw.thermo import ThermoRawData
+    from masster.sample.thermo import ThermoRawData
     if not filename:
         raise ValueError("Filename must be provided.")
@@ -464,6 +480,13 @@ def _load_raw(
             prec_intyensity = None
             energy = s["nce"]
+        # try to get polarity
+        if self.polarity is None:
+            if s['polarity'] == 'positive':
+                self.polarity = 'positive'
+            elif s['polarity'] == 'negative':
+                self.polarity = 'negative'
         peak_start_idx = s["peak_start_idx"]
         peak_stop_idx = s["peak_stop_idx"]
         peaks = raw_data.peak_df.loc[peak_start_idx : peak_stop_idx - 1]
@@ -564,16 +587,10 @@ def _load_wiff(
     self,
     filename=None,
 ):
-    try:
-        # Use masster's own implementation first
-        from masster.sample.sciex import SciexWiffData as MassterSciexWiffData
+    # Use masster's own implementation first
+    from masster.sample.sciex import SciexWiffData as MassterSciexWiffData
-        SciexWiffDataClass = MassterSciexWiffData
-    except ImportError:
-        # Fallback to alpharaw if masster implementation fails
-        from alpharaw.sciex import SciexWiffData as AlpharawSciexWiffData
-        SciexWiffDataClass = AlpharawSciexWiffData
+    SciexWiffDataClass = MassterSciexWiffData
     if not filename:
         raise ValueError("Filename must be provided.")
@@ -610,7 +627,7 @@ def _load_wiff(
         "mz": pl.Float64,
         "inty": pl.Float64,
     }
+    polarity = None
     # iterate over rows of specs
     tdqm_disable = self.log_level not in ["TRACE", "DEBUG", "INFO"]
     for i, s in tqdm(
@@ -620,6 +637,13 @@ def _load_wiff(
         disable=tdqm_disable,
     ):
         ms_level = s["ms_level"]
+        # try to get polarity
+        if polarity is None:
+            if s['polarity'] == 'positive':
+                polarity = 'positive'
+            elif s['polarity'] == 'negative':
+                polarity = 'negative'
         if ms_level == 1:
             cycle += 1
             prec_mz = None
@@ -723,7 +747,7 @@ def _load_wiff(
     self.file_interface = "alpharaw"
     self.label = os.path.basename(filename)
     self.ms1_df = pl.DataFrame(ms1_df_records, schema=schema)
-    if self.file_type != "ztscan":
+    if self.type != "ztscan":
         self.analyze_dda()
@@ -750,103 +774,6 @@ def _load_featureXML(
     fm = oms.FeatureMap()
     fh.load(filename, fm)
     self._oms_features_map = fm
-    """if self.features_df is None:
-        df = self._oms_features_map.get_df(export_peptide_identifications=False)
-        df = self._clean_features_df(df)
-        # desotope features
-        df = self._features_deisotope(df, mz_tol=0.02, rt_tol=0.5)
-        # update eic
-        df["chrom"] = None
-        mz_tol = 0.01
-        rt_tol = 10
-        # iterate over all rows in df
-        for i, row in df.iterrows():
-            # select data in ms1_df with mz in range [mz_start - mz_tol, mz_end + mz_tol] and rt in range [rt_start - rt_tol, rt_end + rt_tol]
-            d = self.ms1_df.filter(
-                (pl.col("rt") >= row["rt_start"] - rt_tol)
-                & (pl.col("rt") <= row["rt_end"] + rt_tol)
-                & (pl.col("mz") >= row["mz"] - mz_tol)
-                & (pl.col("mz") <= row["mz"] + mz_tol)
-            )
-            # for all unique rt values, find the maximum inty
-            eic_rt = d.group_by("rt").agg(pl.col("inty").max())
-            if len(eic_rt) < 4:
-                continue
-            eic = Chromatogram(
-                eic_rt["rt"].to_numpy(),
-                eic_rt["inty"].to_numpy(),
-                label=f"EIC mz={row['mz']:.4f}",
-                feature_start=row["rt_start"],
-                feature_end=row["rt_end"],
-                feature_apex=row["rt"],
-            ).find_peaks()
-            # set eic in df
-            df.at[i, "chrom"] = eic
-            if len(eic.peak_widths) > 0:
-                df.at[i, "chrom_coherence"] = round(eic.feature_coherence, 3)
-                df.at[i, "chrom_prominence"] = round(
-                    eic.peak_prominences[0], 3
-                )  # eic.peak_prominences[0]
-                df.at[i, "chrom_prominence_scaled"] = round(
-                    eic.peak_prominences[0] / (np.mean(eic.inty) + 1e-10), 3
-                )
-                df.at[i, "chrom_height_scaled"] = round(
-                    eic.peak_heights[0] / (np.mean(eic.inty) + 1e-10), 3
-                )
-        self.features_df = df"""
-'''
-def _load_mzpkl(
-    self,
-    filename="sample.mzpkl",
-    ondisk=False,
-):
-    """
-    Load the mzpkl data file, initialize the experiment attributes, and set up the file object.
-    Parameters:
-        filename (str, optional): The path to the .mzpkl file to be loaded. Defaults to "data.mzpkl".
-        ondisk (bool, optional): A flag indicating whether the data should be loaded for on-disk usage.
-                                    If True, self.ondisk is set to True and an OnDiscMSExperiment is used.
-                                    Otherwise, an MSExperiment is used.
-    Side Effects:
-        - Decompresses and unpickles the specified file.
-        - Sets attributes on self for each key in the loaded data dictionary, except for keys named 'format'.
-        - Renames the attribute 'spectra_df' to 'scans_df' if present.
-        - Initializes self.file_obj as either an OnDiscMSExperiment or MSExperiment based on the ondisk flag.
-        - Checks for an associated featureXML file (with the same base name as the input file) and loads it if found.
-    """
-    if ondisk is True:
-        self.ondisk = True
-    with bz2.BZ2File(filename, "rb") as f:
-        data = pickle.load(f)
-    for k, v in data.items():
-        if k in ["format"]:
-            continue
-        if k == "spectra_df":
-            k = "scans_df"
-    setattr(self, k, v)
-# Import and call internal sanitize function
-from masster.study.load import _sanitize
-_sanitize(self)    if self.ondisk:
-        self.file_obj = oms.OnDiscMSExperiment()
-    else:
-        self.file_obj = oms.MSExperiment()
-    # check if *.featureXML exists
-    featureXML = filename.replace(".mzpkl", ".featureXML")
-    if os.path.exists(featureXML):
-        self._load_featureXML(featureXML)
-'''
 def _wiff_to_dict(
     filename=None,

masster/sample/processing.py CHANGED Viewed

@@ -248,7 +248,7 @@ def get_spectrum(self, scan, **kwargs):
         spect = spect.keep_top(max_peaks)
     if dia_stats:
-        if self.file_type in ["ztscan", "dia"]:
+        if self.type in ["ztscan", "dia", "swath"]:
             spect = self._get_ztscan_stats(
                 spec=spect,
                 scan_uid=scan_uid,
@@ -1028,7 +1028,7 @@ def find_ms2(self, **kwargs):
     - mz_tol (float):
         Precursor m/z tolerance used for matching. The effective tolerance may be
-        adjusted by file type (the defaults class provides ``get_mz_tolerance(file_type)``).
+        adjusted by type (the defaults class provides ``get_mz_tolerance(type)``).
         Default: 0.5 (ztscan/DIA defaults may be larger).
     - centroid (bool):
@@ -1077,7 +1077,7 @@ def find_ms2(self, **kwargs):
     # Extract parameter values
     features = params.get("features")
-    mz_tol = params.get_mz_tolerance(self.file_type)
+    mz_tol = params.get_mz_tolerance(self.type)
     centroid = params.get("centroid")
     deisotope = params.get("deisotope")
     dia_stats = params.get("dia_stats")

masster/sample/sample.py CHANGED Viewed

@@ -240,12 +240,13 @@ class Sample:
         # Initialize label from parameters
         self.label = params.label
+        self.type = params.type  # dda, dia, ztscan
+        self.polarity = params.polarity  # Initialize from parameters, may be overridden during raw file loading
         # this is the path to the original file. It's never sample5
         self.file_source = None
         # this is the path to the object that was loaded. It could be sample5
         self.file_path = None
-        # Type of the file (e.g., mzML, RAW, WIFF, mzpkl)
-        self.file_type = None
         # Interface to handle the file operations (e.g., oms, alpharaw)
         self.file_interface = None
         # The file object once loaded, can be oms.MzMLFile or alpharaw.AlphaRawFile
@@ -327,7 +328,6 @@ class Sample:
     _save_sample5 = _save_sample5
     _load_sample5 = _load_sample5
     # Removed internal-only load methods: _load_featureXML, _load_ms2data, _load_mzML, _load_raw, _load_wiff
     chrom_extract = chrom_extract
     _index_file = _index_file  # Renamed from index_file to be internal-only
@@ -503,6 +503,8 @@ class Sample:
         str = f"File: {os.path.basename(self.file_path)}\n"
         str += f"Path: {os.path.dirname(self.file_path)}\n"
         str += f"Source: {self.file_source}\n"
+        str += f"Type: {self.type}\n"
+        str += f"Polarity: {self.polarity}\n"
         str += f"MS1 scans: {len(self.scans_df.filter(pl.col('ms_level') == 1))}\n"
         str += f"MS2 scans: {len(self.scans_df.filter(pl.col('ms_level') == 2))}\n"
         if self.features_df is not None:

masster 0.5.17__py3-none-any.whl → 0.5.19__py3-none-any.whl

Potentially problematic release.

masster 0.5.17__py3-none-any.whl → 0.5.19__py3-none-any.whl