PyPI - masster - Versions diffs - 0.2.5__py3-none-any.whl → 0.3.1__py3-none-any.whl - Mend

masster 0.2.5__py3-none-any.whl → 0.3.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of masster might be problematic. Click here for more details.

Files changed (55) hide show

masster/__init__.py +27 -27
masster/_version.py +17 -17
masster/chromatogram.py +497 -503
masster/data/examples/2025_01_14_VW_7600_LpMx_DBS_CID_2min_TOP15_030msecMS1_005msecReac_CE35_DBS-ON_3.featureXML +199787 -0
masster/data/examples/2025_01_14_VW_7600_LpMx_DBS_CID_2min_TOP15_030msecMS1_005msecReac_CE35_DBS-ON_3.sample5 +0 -0
masster/logger.py +318 -244
masster/sample/__init__.py +9 -9
masster/sample/defaults/__init__.py +15 -15
masster/sample/defaults/find_adducts_def.py +325 -325
masster/sample/defaults/find_features_def.py +366 -366
masster/sample/defaults/find_ms2_def.py +285 -285
masster/sample/defaults/get_spectrum_def.py +314 -318
masster/sample/defaults/sample_def.py +374 -378
masster/sample/h5.py +1321 -1297
masster/sample/helpers.py +833 -364
masster/sample/lib.py +762 -0
masster/sample/load.py +1220 -1187
masster/sample/parameters.py +131 -131
masster/sample/plot.py +1685 -1622
masster/sample/processing.py +1402 -1416
masster/sample/quant.py +209 -0
masster/sample/sample.py +393 -387
masster/sample/sample5_schema.json +181 -181
masster/sample/save.py +737 -736
masster/sample/sciex.py +1213 -0
masster/spectrum.py +1287 -1319
masster/study/__init__.py +9 -9
masster/study/defaults/__init__.py +21 -19
masster/study/defaults/align_def.py +267 -267
masster/study/defaults/export_def.py +41 -40
masster/study/defaults/fill_chrom_def.py +264 -264
masster/study/defaults/fill_def.py +260 -0
masster/study/defaults/find_consensus_def.py +256 -256
masster/study/defaults/find_ms2_def.py +163 -163
masster/study/defaults/integrate_chrom_def.py +225 -225
masster/study/defaults/integrate_def.py +221 -0
masster/study/defaults/merge_def.py +256 -0
masster/study/defaults/study_def.py +272 -269
masster/study/export.py +674 -287
masster/study/h5.py +1406 -886
masster/study/helpers.py +1713 -433
masster/study/helpers_optimized.py +317 -0
masster/study/load.py +1231 -1078
masster/study/parameters.py +99 -99
masster/study/plot.py +632 -645
masster/study/processing.py +1057 -1046
masster/study/save.py +161 -134
masster/study/study.py +612 -522
masster/study/study5_schema.json +253 -241
{masster-0.2.5.dist-info → masster-0.3.1.dist-info}/METADATA +15 -10
masster-0.3.1.dist-info/RECORD +59 -0
{masster-0.2.5.dist-info → masster-0.3.1.dist-info}/licenses/LICENSE +661 -661
masster-0.2.5.dist-info/RECORD +0 -50
{masster-0.2.5.dist-info → masster-0.3.1.dist-info}/WHEEL +0 -0
{masster-0.2.5.dist-info → masster-0.3.1.dist-info}/entry_points.txt +0 -0

masster/sample/quant.py ADDED Viewed

@@ -0,0 +1,209 @@
+# A module for the reproducible quantification of EIC traces.
+# It takes a study and a list of features, indicated either as MS1 or MRM features.
+import os
+import pandas as pd
+# from .parameters import QuantParameters
+# Parameters removed - using hardcoded defaults
+def _first_column(columns, candidates):
+    """Return the first name in ``candidates`` that occurs in ``columns``, else None."""
+    return next((name for name in candidates if name in columns), None)
+
+
+def chrom_from_csv(
+    self,
+    filename=None,
+):
+    """
+    Load MRM transitions from a CSV file and store them in ``self.chrom_df``.
+
+    Lines starting with ``#`` are treated as comments. Column names are matched
+    case-insensitively. ``name`` is required, as is a precursor column
+    (``q1``, ``precursor`` or ``precursor_mz``). A product column (``q3``,
+    ``product`` or ``product_mz``) and the columns ``qid``, ``group``, ``rt``,
+    ``istd``, ``adduct``, ``class``, ``formula``, ``inchikey`` and ``smiles``
+    are optional.
+
+    :param filename: Path to the CSV file. If it is empty/None or does not end
+        in ".csv", nothing is loaded and ``self.chrom_df`` is left untouched.
+    :return: None. The transitions are stored as a DataFrame in ``self.chrom_df``.
+    :raises ValueError: If the ``name`` column or a precursor column is missing.
+    """
+    # os.fspath lets pathlib.Path objects through as well as plain strings.
+    if not filename or not os.fspath(filename).endswith(".csv"):
+        return
+    df = pd.read_csv(filename, comment="#")
+    # Normalise the header so upper- and lower-case spellings are equivalent.
+    df.columns = [col.lower() for col in df.columns]
+    available = set(df.columns)
+    if "name" not in available:
+        raise ValueError("CSV file must contain a 'name' column.")
+    col_q1 = _first_column(available, ("q1", "precursor", "precursor_mz"))
+    if col_q1 is None:
+        raise ValueError("CSV file must contain a 'q1' column or equivalent.")
+    col_q3 = _first_column(available, ("q3", "product", "product_mz"))
+
+    def optional(row, column):
+        # Every optional column degrades to None instead of raising KeyError.
+        return row[column] if column in available else None
+
+    traces = [
+        {
+            # Without a 'qid' column, fall back to the 0-based row position so
+            # every trace still gets an identifier.
+            "chid": row["qid"] if "qid" in available else position,
+            "type": "mrm",
+            "name": row["name"],
+            "group": optional(row, "group"),
+            "prec_mz": row[col_q1],
+            "prod_mz": row[col_q3] if col_q3 else None,
+            "rt": optional(row, "rt"),
+            "rt_start": None,
+            "rt_end": None,
+            "istd": optional(row, "istd"),
+            "adduct": optional(row, "adduct"),
+            "class": optional(row, "class"),
+            "formula": optional(row, "formula"),
+            "inchikey": optional(row, "inchikey"),
+            "smiles": optional(row, "smiles"),
+        }
+        for position, (_, row) in enumerate(df.iterrows())
+    ]
+    self.chrom_df = pd.DataFrame(traces)
+    return
+def _parse_oracle_fragments(cell):
+    """Parse a fragment cell of the form "mz|label  mz|label" into {label: mz}."""
+    # Missing cells come back from pandas as NaN (a float), not as a string.
+    if not isinstance(cell, str):
+        return {}
+    fragments = {}
+    # Tokens are separated by two spaces; fields inside a token by '|'.
+    for token in cell.split("  "):
+        if not token.strip():
+            continue
+        parts = token.split("|")
+        if len(parts) > 1:
+            # parts[1] is used as the key, parts[0] as the numeric value.
+            fragments[parts[1]] = float(parts[0])
+    return fragments
+
+
+def chrom_from_oracle(
+    self,
+    oracle_folder=None,
+    classes=None,
+    level=None,
+):
+    """
+    Build MRM traces from an oracle annotation file and store them in ``self.chrom_df``.
+
+    Reads ``<oracle_folder>/diag/annotation_full.csv`` and emits one trace per
+    fragment listed in the ``ms2_matched`` and ``ms2_missed`` columns of every
+    selected level-2 row. Traces are numbered consecutively from 0 in ``chid``.
+
+    :param oracle_folder: Folder containing ``diag/annotation_full.csv``. If None,
+        the function returns without doing anything.
+    :param classes: Optional collection of ``hg`` values; rows whose ``hg`` is not
+        in it are skipped. None keeps every class.
+    :param level: Collection of annotation levels to keep. Defaults to ``[2]``.
+        Only level-2 rows produce traces, so a selection without 2 yields none.
+    :return: None. The traces are stored as a DataFrame in ``self.chrom_df``.
+    :raises KeyError: If the annotation file lacks one of the expected columns.
+    """
+    if level is None:
+        level = [2]
+    if oracle_folder is None:
+        return
+    try:
+        oracle_data = pd.read_csv(
+            os.path.join(oracle_folder, "diag", "annotation_full.csv"),
+        )
+    except (OSError, ValueError):
+        # OSError covers missing/unreadable files; pandas parser and decoding
+        # errors derive from ValueError. Unlike a bare except, this lets
+        # KeyboardInterrupt and SystemExit propagate.
+        print(f"Could not read {oracle_folder}/diag/annotation_full.csv")
+        return
+    cols_to_keep = [
+        "mz",
+        "rt",
+        "level",
+        "formula",
+        "ion",
+        "name",
+        "hg",
+        "ms2_matched",
+        "ms2_missed",
+    ]
+    # Selecting the columns up front also fails fast when one is missing.
+    oracle_data = oracle_data[cols_to_keep]
+    traces = []
+    qid = 0
+    for _, row in oracle_data.iterrows():
+        # Skip rows outside the requested levels or classes.
+        if row["level"] not in level:
+            continue
+        if classes is not None and row["hg"] not in classes:
+            continue
+        # Fragment traces are only built for level-2 rows.
+        if row["level"] != 2:
+            continue
+        frags = _parse_oracle_fragments(row["ms2_matched"])
+        # A label present in both columns takes its value from ms2_missed.
+        frags.update(_parse_oracle_fragments(row["ms2_missed"]))
+        label = f"{row['name']} {row['ion']}"
+        for prod_mz in frags.values():
+            traces.append({
+                "chid": qid,
+                "type": "mrm",
+                "name": label,
+                "group": label,
+                "prec_mz": row["mz"],
+                "prod_mz": prod_mz,
+                "rt": row["rt"],
+                "rt_start": None,
+                "rt_end": None,
+                "istd": None,
+                "adduct": row["ion"],
+                "class": row["hg"],
+                "formula": row["formula"],
+                "inchikey": None,
+                "smiles": None,
+            })
+            qid += 1
+    self.chrom_df = pd.DataFrame(traces)
+    return
+def chrom_from_features(
+    self,
+    feature_uid=None,
+):
+    """
+    Create MS1 chromatogram traces from ``self.features_df`` and store them in ``self.chrom_df``.
+
+    One trace is emitted per selected feature row, numbered consecutively from 0
+    in ``chid``, using the row's ``mz``, ``rt``, ``rt_start`` and ``rt_end``.
+
+    :param feature_uid: A single feature UID or any iterable of UIDs (list, tuple,
+        set, array, Series). If None, traces are created for all features.
+    :return: None. The traces are stored as a DataFrame in ``self.chrom_df``.
+    """
+    from collections.abc import Iterable
+
+    features = self.features_df
+    if feature_uid is not None:
+        # A scalar (including a string UID) selects exactly one feature; any
+        # other iterable is taken as the collection of wanted UIDs.
+        if isinstance(feature_uid, (str, bytes)) or not isinstance(feature_uid, Iterable):
+            feature_uid = [feature_uid]
+        features = features[features["feature_uid"].isin(list(feature_uid))]
+    # Iterate column-wise rather than with iterrows(): iterrows() builds one
+    # Series per row and upcasts mixed numeric rows, turning integer uids into
+    # floats ("fid:1.0").
+    columns = zip(
+        features["feature_uid"],
+        features["mz"],
+        features["rt"],
+        features["rt_start"],
+        features["rt_end"],
+    )
+    traces = [
+        {
+            "chid": chid,
+            "type": "ms1",
+            "name": f"MS1 fid:{uid} ({mz:.4f})",
+            "group": f"fid:{uid}",
+            "prec_mz": mz,
+            "prod_mz": None,
+            "rt": rt,
+            "rt_start": rt_start,
+            "rt_end": rt_end,
+            "istd": None,
+            "adduct": None,
+            "class": None,
+            "formula": None,
+            "inchikey": None,
+            "smiles": None,
+        }
+        for chid, (uid, mz, rt, rt_start, rt_end) in enumerate(columns)
+    ]
+    self.chrom_df = pd.DataFrame(traces)
+    return

masster 0.2.5__py3-none-any.whl → 0.3.1__py3-none-any.whl

Potentially problematic release.

masster 0.2.5__py3-none-any.whl → 0.3.1__py3-none-any.whl