PyPI - DeConveil - Versions diffs - 0.1.2__py3-none-any.whl → 0.1.3__py3-none-any.whl - Mend

DeConveil 0.1.2__py3-none-any.whl → 0.1.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (7) hide show

deconveil/__version__.py CHANGED Viewed

	@@ -1 +1 @@
1	- __version__ = "0.1.2"
1	+ __version__ = "0.1.3"

deconveil/utils_processing.py CHANGED Viewed

@@ -5,11 +5,93 @@ from pathlib import Path
 import numpy as np
 import pandas as pd
+import deconveil
 from typing import List, Literal, Optional, Dict, Any, cast
+def load_test_data(
+    modality: Literal["rna", "cnv", "metadata", "cnv_tumor"] = "rna",
+    dataset: Literal["tcga_brca"] = "tcga_brca",
+    debug: bool = False,
+    debug_seed: int = 42,
+) -> pd.DataFrame:
+    """Load TCGA-BRCA example data from the DeConveil package.
+    Parameters
+    ----------
+    modality : {"rna", "cnv", "metadata", "cnv_tumor"}
+        Type of data to load.
+    dataset : {"tcga_brca"}
+        Dataset name. Only "tcga_brca" is currently supported.
+    debug : bool, optional
+        If True, randomly subsample 10 samples and 100 features (if applicable).
+        Default is False.
+    debug_seed : int, optional
+        Random seed for reproducibility of debug subsampling. Default is 42.
+    Returns
+    -------
+    pandas.DataFrame
+        The requested data modality as a DataFrame.
+    """
+    assert modality in ["rna", "cnv", "metadata", "cnv_tumor"], (
+        "modality must be one of: 'rna', 'cnv', 'metadata', 'cnv_tumor'"
+    )
+    assert dataset in ["tcga_brca"], (
+        "dataset must be one of: 'tcga_brca'"
+    )
+    # Locate data within the package
+    datasets_path = Path(__file__).resolve().parent.parent / "datasets" / dataset
+    # Construct file paths
+    file_map = {
+        "rna": datasets_path / "rna.csv",
+        "cnv": datasets_path / "cnv.csv",
+        "metadata": datasets_path / "metadata.csv",
+        "cnv_tumor": datasets_path / "cnv_tumor.csv",
+    }
+    data_path = file_map[modality]
+    if not data_path.exists():
+        raise FileNotFoundError(f"Data file not found: {data_path}")
+    # Load the CSV
+    df = pd.read_csv(data_path, index_col=0)
+    # Apply debug mode subsampling
+    if debug:
+        df = df.sample(n=min(10, df.shape[0]), random_state=debug_seed)
+        if modality in ["rna", "cnv"]:
+            df = df.sample(n=min(100, df.shape[1]), axis=1, random_state=debug_seed)
+    return df
+def replace_underscores(factors: List[str]):
+    """Replace all underscores from strings in a list by hyphens.
+    To be used on design factors to avoid bugs due to the reliance on
+    ``str.split("_")`` in parts of the code.
+    Parameters
+    ----------
+    factors : list
+        A list of strings which may contain underscores.
+    Returns
+    -------
+    list
+        A list of strings in which underscores were replaced by hyphens.
+    """
+    return [factor.replace("_", "-") for factor in factors]
 def filter_low_count_genes(
     df: pd.DataFrame,
     other_dfs: Optional[List[pd.DataFrame]] = None,

{deconveil-0.1.2.dist-info → deconveil-0.1.3.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: DeConveil
-Version: 0.1.2
+Version: 0.1.3
 Summary: An extension of PyDESeq2/DESeq2 designed to account for genome aneuploidy
 Home-page: https://github.com/caravagnalab/DeConveil
 Author: Katsiaryna Davydzenka

{deconveil-0.1.2.dist-info → deconveil-0.1.3.dist-info}/RECORD RENAMED Viewed

@@ -1,5 +1,5 @@
 deconveil/__init__.py,sha256=_6FL_AYiycv9nP3mKJiQ4zl4aU83YSWnV2YoIZr9Mv0,188
-deconveil/__version__.py,sha256=K5SiDdEGYMpdqXThrqwTqECJJBOQNTQDrnpc2K5mzKs,21
+deconveil/__version__.py,sha256=XEqb2aiIn8fzGE68Mph4ck1FtQqsR_am0wRWvrYPffQ,22
 deconveil/dds.py,sha256=0MNwtDzCjqjoJR-rrCmVu3JOaDd3gXuToOzTBXJMxak,49039
 deconveil/default_inference.py,sha256=J40O0-qZChLnLrLGmhwxjaTVsV7REWAUQOTf8qSwWk0,9466
 deconveil/ds.py,sha256=Vb9p152U1KXltrXFpMoBxY6YRW25dP4CO26_osbz6Aw,29476
@@ -8,9 +8,9 @@ deconveil/inference.py,sha256=B3zf3q_mbCTX3gHJwuXnTuy9uyXOxEjuWyaSR6VtVEo,10429
 deconveil/utils_clustering.py,sha256=twspPvXQ6pvw_NaY1ebyvswuH3ZvVBGn7DeOpZ1XatI,5939
 deconveil/utils_fit.py,sha256=SdGcBQjN3cyzbSFessufYOOOJAQCOjNcy3etbwmodsM,21583
 deconveil/utils_plot.py,sha256=1JQthYXaEUKUWa0fy8owkyJ1CTkQxlrSRAqPkXMk7Us,9857
-deconveil/utils_processing.py,sha256=CB99CwQst7eUiIgE58yl7_3E6uD9CgQoU_Qmprjyt-s,4141
-deconveil-0.1.2.dist-info/licenses/LICENSE,sha256=BJ0f3JRteiF7tjiARi8syxiu4yKmckc0nWlHCKXttKQ,1078
-deconveil-0.1.2.dist-info/METADATA,sha256=JqHZYXo0lLvPjoj_cDT-IwHADSKdESJQxorDbpsk3-k,1097
-deconveil-0.1.2.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
-deconveil-0.1.2.dist-info/top_level.txt,sha256=yAWZbw0eg8XpbMsswoq-VzBGfQHrfWOqNHnu2qQ2xO4,10
-deconveil-0.1.2.dist-info/RECORD,,
+deconveil/utils_processing.py,sha256=9j35FAfQ7oNjdH1FWHP90DBTyL5RwlgdVbbW9de10VI,6560
+deconveil-0.1.3.dist-info/licenses/LICENSE,sha256=BJ0f3JRteiF7tjiARi8syxiu4yKmckc0nWlHCKXttKQ,1078
+deconveil-0.1.3.dist-info/METADATA,sha256=yL6AwQ5ziGhrI5lE4FDCHOadT81W6yEIDWGsHni6Q5w,1097
+deconveil-0.1.3.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
+deconveil-0.1.3.dist-info/top_level.txt,sha256=yAWZbw0eg8XpbMsswoq-VzBGfQHrfWOqNHnu2qQ2xO4,10
+deconveil-0.1.3.dist-info/RECORD,,

{deconveil-0.1.2.dist-info → deconveil-0.1.3.dist-info}/WHEEL RENAMED Viewed

File without changes

{deconveil-0.1.2.dist-info → deconveil-0.1.3.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

{deconveil-0.1.2.dist-info → deconveil-0.1.3.dist-info}/top_level.txt RENAMED Viewed

File without changes

DeConveil 0.1.2__py3-none-any.whl → 0.1.3__py3-none-any.whl

DeConveil 0.1.2__py3-none-any.whl → 0.1.3__py3-none-any.whl