PyPI - metahq-core - Versions diffs - 0.1.2__py3-none-any.whl → 1.0.0rc1__py3-none-any.whl - Mend

metahq-core 0.1.2__py3-none-any.whl → 1.0.0rc1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (23) hide show

metahq_core/__init__.py +1 -1
metahq_core/curations/annotation_converter.py +5 -5
metahq_core/curations/annotations.py +361 -151
metahq_core/curations/index.py +104 -43
metahq_core/curations/labels.py +259 -128
metahq_core/curations/propagator.py +62 -85
metahq_core/export/__init__.py +0 -0
metahq_core/export/annotations.py +125 -59
metahq_core/export/labels.py +128 -70
metahq_core/logger.py +11 -18
metahq_core/query.py +346 -241
metahq_core/{ontology/loader.py → relations_loader.py} +2 -1
metahq_core/search.py +37 -14
metahq_core/util/io.py +109 -46
metahq_core/util/supported.py +16 -5
{metahq_core-0.1.2.dist-info → metahq_core-1.0.0rc1.dist-info}/METADATA +13 -6
metahq_core-1.0.0rc1.dist-info/RECORD +30 -0
{metahq_core-0.1.2.dist-info → metahq_core-1.0.0rc1.dist-info}/WHEEL +1 -1
metahq_core-1.0.0rc1.dist-info/licenses/LICENSE +28 -0
metahq_core/ontology/base.py +0 -376
metahq_core/ontology/graph.py +0 -252
metahq_core-0.1.2.dist-info/RECORD +0 -30
/metahq_core/{ontology → curations}/__init__.py +0 -0

metahq_core/curations/annotations.py CHANGED Viewed

@@ -4,7 +4,7 @@ Class for storing and mutating annotation collections.
 Author: Parker Hicks
 Date: 2025-04-14
-Last updated: 2025-11-21 by Parker Hicks
+Last updated: 2026-02-02 by Parker Hicks
 """
 from __future__ import annotations
@@ -20,7 +20,7 @@ from metahq_core.curations.index import Ids
 from metahq_core.curations.labels import Labels
 from metahq_core.export.annotations import AnnotationsExporter
 from metahq_core.logger import setup_logger
-from metahq_core.util.alltypes import FilePath
+from metahq_core.util.supported import get_default_log_dir
 if TYPE_CHECKING:
     import logging
@@ -31,87 +31,24 @@ class Annotations(BaseCuration):
     Class to store and mutate annotations of samples to various attributes
     like tissues, dieases, sexes, ages, etc.
-    Attributes
-    ----------
-    data: pl.DataFrame
-        Polars DataFrame with columns `index`, `groups` and columns for each
-        attribute entity for each index (e.g. male or female, tissues, diseases, etc).
+    Attributes:
+        data (pl.DataFrame):
+            Polars DataFrame with index and group ID columns and columns for each
+                attribute entity for each index (e.g. male or female, tissues, diseases, etc).
-    disease: bool
-        Indicates if the annotations are disease based. Used to account for control samples
-        when converting annotations to labels.
+        disease (bool):
+            Indicates if the annotations are disease based. Used to account for control samples
+                when converting annotations to labels.
-    index_col: IdArray
-        Name of the column of data that contains the index IDs.
+        index_col (str):
+            Name of the column of data that contains the index IDs.
-    group_cols: tuple
-        Names of columns of data that contain an ID for each index indicating if it belongs
-        to a particular group (e.g. dataset, sex, platform, etc.).
-    collapsed: bool
-        Indicates if the annotations have already been collapsed.
-    Methods
-    -------
-    collapse()
-        Collapses index annotations to group annotations.
-    drop()
-        Wrapper for polars `drop`.
-    filter()
-        Wrapper for polars `filter`.
-    from_df()
-        Creates an Annotations object from a polars DataFrame or LazyFrame.
-    head()
-        Wrapper for polars `head`.
-    propagate_controls()
-        Propagates control samples to diseases that other samples in the same
-        dataset are annotated to.
-    select()
-        Wrapper for polars `select`.
-    slice()
-        Wrapper for polars `slice`.
-    to_labels()
-        Propagates annotations to labels for an annotations matrix, given a reference
-        ontology.
-    to_numpy()
-        Returns the annotations frame as a numpy 2D array.
-    to_parquet()
-        Saves the annotations frame and IDs to a .parquet file.
-    Properties
-    ---------
-    entities: list[str]
-        columns of the annotations frame of ontology terms.
-    groups: list[str]
-        Groups associated with each index of the annotations curation.
-        Note that groups are not unique.
-    ids: pl.DataFrame
-        The frame of all IDs within the annotations curation.
-    index
-        The index IDs of the annotations frame.
-    n_entities: int
-        Number of unique entities.
-    n_index: int
-        Number of indices.
-    unique_groups: list[str]
-        Unique groups in the annotations curation.
+        group_cols (tuple[str, ...]):
+            Names of columns of data that contain an ID for each index indicating if it belongs
+                to a particular group (e.g. dataset, sex, platform, etc.).
+        collapsed (bool):
+            Indicates if the annotations have already been collapsed.
     """
     def __init__(
@@ -123,7 +60,7 @@ class Annotations(BaseCuration):
         collapsed: bool = False,
         logger=None,
         loglevel=20,
-        logdir=Path("."),
+        logdir=get_default_log_dir(),
         verbose=True,
     ):
         self.data = data
@@ -139,14 +76,21 @@ class Annotations(BaseCuration):
         self.verbose: bool = verbose
     def add_ids(self, new: pl.DataFrame) -> Annotations:
-        """
-        Append new group ID columns to the IDs of an Annotations object. The new
+        """Append new group ID columns to the IDs of an Annotations object. The new
         IDs must have a matching index.
+        Arguments:
+            new (pl.DataFrame):
+                A DataFrame of additional IDs to join with the current index column of `data`.
+                    Must have a matching index column as the original `data`.
+        Returns:
+            A new Annotations object including the new ID columns.
         """
         new_ids = new.join(
             self.ids, on=self.index_col, how="inner", maintain_order="right"
         )
-        new_groups = tuple([col for col in new_ids.columns if col != self.index_col])
+        new_groups = tuple(col for col in new_ids.columns if col != self.index_col)
         assert new_ids.height == self.ids.height, "SRA IDs height mismatch."
         assert (
             new_ids[self.index_col].to_list() == self.index
@@ -157,15 +101,13 @@ class Annotations(BaseCuration):
         )
     def collapse(self, on: str, inplace: bool = True):
-        """
-        Collapses annotations on the specified grouping column.
-        Args
-        ----
-        on: str
-            The column to collapse on (should be one of the group_cols)
-        inplace: bool
-            If True, updates this object and returns self. If False, returns new object.
+        """Collapses annotations on the specified grouping column.
+        Arguments:
+            on (str):
+                The column to collapse on. This should be one of the columns in `group_cols`.
+            inplace (bool):
+                If True, updates this object and returns self. Otherwise, returns new object.
         """
         params = self._collapse(on)
@@ -180,7 +122,9 @@ class Annotations(BaseCuration):
         return self.__class__(**params)
     def drop(self, *args, **kwargs) -> Annotations:
-        """Wrapper for polars drop. Drops any of the term columns."""
+        """Wrapper for polars drop. Drops any of the term columns.
+        ID columns are not dropped through this method.
+        """
         return self.__class__(
             data=self.data.drop(*args, **kwargs),
             ids=self.ids,
@@ -192,7 +136,31 @@ class Annotations(BaseCuration):
         )
     def filter(self, condition: pl.Expr) -> Annotations:
-        """Filter both data and ids simultaneously using a mask."""
+        """Filter both data and ids simultaneously using a mask.
+        Arguments:
+            condition (pl.Expr):
+                Polars expression for filtering columns.
+        Examples:
+            >>> from metahq_core.curations.annotations import Annotations
+            >>> anno = {
+                    'sample': ['GSM1', 'GSM2', 'GSM3'],
+                    'series': ['GSE1', 'GSE1', 'GSE2'],
+                    'UBERON:0000948': [1, 0, 0],
+                    'UBERON:0002113': [0, 1, 0],
+                    'UBERON:0000955': [0, 0, 1],
+                }
+            >>> anno = Annotations.from_df(anno, index_col="sample", group_cols=["series"])
+            >>> anno.filter(pl.col("UBERON:0000948") == 1)
+            ┌────────┬────────┬────────────────┬────────────────┬────────────────┐
+            │ sample ┆ series ┆ UBERON:0000948 ┆ UBERON:0002113 ┆ UBERON:0000955 │
+            │ ---    ┆ ---    ┆ ---            ┆ ---            ┆ ---            │
+            │ str    ┆ str    ┆ i32            ┆ i32            ┆ i32            │
+            ╞════════╪════════╪════════════════╪════════════════╪════════════════╡
+            │ GSM1   ┆ GSE1   ┆ 1              ┆ 0              ┆ 0              │
+            └────────┴────────┴────────────────┴────────────────┴────────────────┘
+        """
         mask = self.data.select(condition.arg_true()).to_numpy().reshape(-1)
         filtered_data = (
@@ -216,29 +184,58 @@ class Annotations(BaseCuration):
     def save(
         self,
-        outfile: FilePath,
+        outfile: str | Path,
         fmt: Literal["json", "parquet", "csv", "tsv"],
+        attribute: str,
+        level: str,
         metadata: str | None = None,
     ):
-        """
-        Save annotations curation to json. Keys are terms and values are
-        positively annotated indices.
+        """Save the annotations curation.
-        Parameters
-        ----------
-        outfile: FilePath
-            Path to outfile.json.
+        Arguments:
+            outfile (str | Path):
+                Path to outfile.json.
-        metadata: bool
-            If True, will add index titles to each entry.
+            fmt (Literal["json", "parquet", "csv", "tsv"]):
+                File format to save to.
+            attribute (str):
+                A supported MetaHQ annotated attribute.
+            level (str):
+                An index level supported by MetaHQ.
+            metadata (bool):
+                If True, will add index titles to each entry.
         """
-        AnnotationsExporter(logger=self.log, verbose=self.verbose).save(
-            self, fmt, outfile, metadata
-        )
+        AnnotationsExporter(
+            attribute, level, logger=self.log, verbose=self.verbose
+        ).save(self, fmt, outfile, metadata)
     def sort_columns(self):
-        """Sorts term columns."""
+        """Sorts term columns.
+        Examples:
+            >>> from metahq_core.curations.annotations import Annotations
+            >>> anno = {
+                    'sample': ['GSM1', 'GSM2', 'GSM3'],
+                    'series': ['GSE1', 'GSE1', 'GSE2'],
+                    'UBERON:0000948': [1, 0, 0],
+                    'UBERON:0002113': [0, 1, 0],
+                    'UBERON:0000955': [0, 0, 1],
+                }
+            >>> anno = Annotations.from_df(anno, index_col="sample", group_cols=["series"])
+            >>> anno.sort_columns()
+            ┌────────┬────────┬────────────────┬────────────────┬────────────────┐
+            │ series ┆ sample ┆ UBERON:0000948 ┆ UBERON:0000955 ┆ UBERON:0002113 │
+            │ ---    ┆ ---    ┆ ---            ┆ ---            ┆ ---            │
+            │ str    ┆ str    ┆ i32            ┆ i32            ┆ i32            │
+            ╞════════╪════════╪════════════════╪════════════════╪════════════════╡
+            │ GSE1   ┆ GSM1   ┆ 1              ┆ 0              ┆ 0              │
+            │ GSE1   ┆ GSM2   ┆ 0              ┆ 0              ┆ 1              │
+            │ GSE2   ┆ GSM3   ┆ 0              ┆ 1              ┆ 0              │
+            └────────┴────────┴────────────────┴────────────────┴────────────────┘
+        """
         return self.__class__(
             data=self.data.select(sorted(self.data.columns)),
             ids=self.ids,
@@ -260,35 +257,72 @@ class Annotations(BaseCuration):
         Assigns propagated labels to terms given their annotations.
-        Parameters
-        ----------
-        to_terms: list[str]
-            Array of terms to generate labels for, or "union"/"all".
-        ontology: str
-            The name of an ontology to reference for annotation propagation.
-        mode: Literal[0, 1]
-            Mode of propagation.
-            If mode is 0, this will propagate any positive annotations
-            from any descendants of the to_terms up to the to_terms.
-            If mode 1, this will convert annotations to -1, 0, +1 labels
-            where for a particular term, if an index is annotated to that term or
-            any of its descendants, it recieves a +1 label. If it is annotated to an
-            ancestor of that term, it receives a 0 (unsure) label. If it is not annotated
-            to an ancestor or a descendant of that term, it recieves a -1 label.
-            Any indices annotated to the control column are assigned a label of 2 for any
-            terms that other indices within the same group are positively labeled to.
-        control_col: str
-            Column name for control annotations.
-        Returns
-        -------
-        A Labels curation object with propagated -1, 0, +1 labels (and 2 if controls are present).
+        Arguments:
+            to_terms (list[str]):
+                Array of terms to generate labels for, or "union"/"all".
+            ontology (str):
+                The name of an ontology to reference for annotation propagation.
+            mode (Literal[0, 1]):
+                Mode of propagation.
+                    If mode is 0, this will propagate any positive annotations
+                    from any descendants of the to_terms up to the to_terms.
+                    If mode 1, this will convert annotations to -1, 0, +1 labels
+                    where for a particular term, if an index is annotated to that term or
+                    any of its descendants, it recieves a +1 label. If it is annotated to an
+                    ancestor of that term, it receives a 0 (unsure) label. If it is not annotated
+                    to an ancestor or a descendant of that term, it recieves a -1 label.
+                    Any indices annotated to the control column are assigned a label of 2 for any
+                    terms that other indices within the same group are positively labeled to.
+            control_col (str):
+                Column name for control annotations.
+        Returns:
+            A Labels curation object with propagated -1, 0, +1 labels (and 2 if controls are
+            present). Any entries in `index_col` that have a 0 annotation/label across all
+            entity columns are dropped.
+        Examples:
+            With `mode=0`:
+            >>> anno = pl.DataFrame(
+                    {
+                        "series": ["GSE1", "GSE1", "GSE2"],
+                        "sample": ["GSM1", "GSM2", "GSM3"],
+                        "UBERON:0000948": [1, 0, 0],
+                        "UBERON:0002349": [1, 1, 0],
+                        "UBERON:0002113": [0, 0, 0],
+                        "UBERON:0000955": [0, 0, 1],
+                    }
+                )
+            >>> anno = Annotations.from_df(anno, index_col="sample", group_cols=["series"])
+            >>> anno.propagate(to_terms=["UBERON:0000948"], ontology="uberon", mode=0)
+            ┌────────┬────────┬────────────────┐
+            │ sample ┆ series ┆ UBERON:0000948 │
+            │ ---    ┆ ---    ┆ ---            │
+            │ str    ┆ str    ┆ i32            │
+            ╞════════╪════════╪════════════════╡
+            │ GSM1   ┆ GSE1   ┆ 1              │
+            │ GSM2   ┆ GSE1   ┆ 1              │
+            └────────┴────────┴────────────────┘
+            With `mode=1`:
+            >>> anno.propagate(to_terms=["UBERON:0000948"], ontology="uberon", mode=1)
+            ┌────────┬────────┬────────────────┐
+            │ sample ┆ series ┆ UBERON:0000948 │
+            │ ---    ┆ ---    ┆ ---            │
+            │ str    ┆ str    ┆ i32            │
+            ╞════════╪════════╪════════════════╡
+            │ GSM1   ┆ GSE1   ┆ 1              │
+            │ GSM2   ┆ GSE1   ┆ 1              │
+            │ GSM3   ┆ GSE2   ┆ -1             │
+            └────────┴────────┴────────────────┘
         """
         converter = AnnotationsConverter(
             self,
@@ -334,7 +368,18 @@ class Annotations(BaseCuration):
         )
     def slice(self, offset: int, length: int | None = None) -> Annotations:
-        """Slice both data and ids simultaneously using polars slice."""
+        """Slice both data and ids simultaneously using `polars` slice.
+        Arguments:
+            offset (int):
+                Index position to begin the slice.
+            length (int | None):
+                Number of indices past `offset` to slice out.
+        Returns:
+            Sliced Annotations object as a subset of the original Annotations.
+        """
         sliced_data = self.data.slice(offset, length)
         sliced_ids_data = self._ids.data.slice(offset, length)
@@ -349,7 +394,9 @@ class Annotations(BaseCuration):
         )
     def _collapse(self, on: str):
-        """Collapses index-level annotations to group-level."""
+        """Collapses index-level annotations to group-level. Helper function
+        for `collapse`.
+        """
         index_anno = self.data.with_columns(self.ids[on])
         agg_anno = index_anno.group_by(on).agg(pl.col("*").sum()).sort(on)
         new_ids = self._collapse_ids(on, keep=agg_anno[on].to_list())
@@ -376,7 +423,9 @@ class Annotations(BaseCuration):
         return params
     def _collapse_ids(self, on: str, keep: list[str]):
-        """Group IDs to keep in the new collapsed frame."""
+        """Group IDs to keep in the new collapsed frame. Helper function
+        for `collapse`.
+        """
         return (
             self.ids.drop(self.index_col)
             .unique()
@@ -389,11 +438,49 @@ class Annotations(BaseCuration):
         cls,
         df: pl.DataFrame,
         index_col: str,
-        group_cols: tuple[str, ...] | list[str] = ("series", "platform"),
+        group_cols: tuple[str, ...] | list[str],
         **kwargs,
     ) -> Annotations:
-        """Creates an Annotations object from a combined DataFrame."""
+        """Creates an Annotations object from a combined DataFrame.
+        Attributes:
+            df (pl.DataFrame):
+                Polars DataFrame with index and group ID columns and columns for each
+                    attribute entity for each index (e.g. male or female, tissues, diseases, etc).
+            index_col (str):
+                Name of the column of data that contains the index IDs.
+            group_cols (tuple[str, ...]):
+                Names of columns of data that contain an ID for each index indicating if it belongs
+                    to a particular group (e.g. dataset, sex, platform, etc.).
+        Returns:
+            An Annotations object constructed from `df`.
+        Examples:
+            >>> from metahq_core.curations.annotations import Annotations
+            >>> anno = pl.DataFrame(
+                    {
+                        "series": ["GSE1", "GSE1", "GSE2"],
+                        "sample": ["GSM1", "GSM2", "GSM3"],
+                        "UBERON:0000948": [1, 0, 0],
+                        "UBERON:0002349": [1, 1, 0],
+                        "UBERON:0002113": [0, 0, 0],
+                        "UBERON:0000955": [0, 0, 1],
+                    }
+                )
+            >>> anno = Annotations.from_df(anno, index_col="sample", group_cols=["series"])
+            ┌────────┬────────┬────────────────┬────────────────┬────────────────┬────────────────┐
+            │ sample ┆ series ┆ UBERON:0000948 ┆ UBERON:0002349 ┆ UBERON:0002113 ┆ UBERON:0000955 │
+            │ ---    ┆ ---    ┆ ---            ┆ ---            ┆ ---            ┆ ---            │
+            │ str    ┆ str    ┆ i64            ┆ i64            ┆ i64            ┆ i64            │
+            ╞════════╪════════╪════════════════╪════════════════╪════════════════╪════════════════╡
+            │ GSM1   ┆ GSE1   ┆ 1              ┆ 1              ┆ 0              ┆ 0              │
+            │ GSM2   ┆ GSE1   ┆ 0              ┆ 1              ┆ 0              ┆ 0              │
+            │ GSM3   ┆ GSE2   ┆ 0              ┆ 0              ┆ 0              ┆ 1              │
+            └────────┴────────┴────────────────┴────────────────┴────────────────┴────────────────┘
+        """
         group_cols = tuple(group_cols)
         id_columns = [index_col] + list(group_cols)
         ids_data = df.select(id_columns)
@@ -409,37 +496,160 @@ class Annotations(BaseCuration):
     @property
     def entities(self) -> list[str]:
-        """Returns term names of the Annotations frame."""
+        """Returns term names of the Annotations frame.
+        Examples:
+            >>> anno = pl.DataFrame(
+                    {
+                        "series": ["GSE1", "GSE1", "GSE2"],
+                        "sample": ["GSM1", "GSM2", "GSM3"],
+                        "UBERON:0000948": [1, 0, 0],
+                        "UBERON:0002349": [1, 1, 0],
+                        "UBERON:0002113": [0, 0, 0],
+                        "UBERON:0000955": [0, 0, 1],
+                    }
+                )
+            >>> anno = Annotations.from_df(anno, index_col="sample", group_cols=["series"])
+            >>> anno.entities
+            ['UBERON:0000955', 'UBERON:0002349', 'UBERON:0000948', 'UBERON:0002113']
+        """
         return list(set(self.data.columns) - set(self.ids.columns))
     @property
     def groups(self) -> list[str]:
-        """Returns the groups column of the Annotations curation."""
+        """Returns the groups column of the Annotations curation.
+        Examples:
+            >>> anno = pl.DataFrame(
+                    {
+                        "series": ["GSE1", "GSE1", "GSE2"],
+                        "sample": ["GSM1", "GSM2", "GSM3"],
+                        "UBERON:0000948": [1, 0, 0],
+                        "UBERON:0002349": [1, 1, 0],
+                        "UBERON:0002113": [0, 0, 0],
+                        "UBERON:0000955": [0, 0, 1],
+                    }
+                )
+            >>> anno = Annotations.from_df(anno, index_col="sample", group_cols=["series"])
+            >>> anno.groups
+            ['GSE1', 'GSE1', 'GSE2']
+        """
         return self.ids["series"].to_list()
     @property
     def ids(self) -> pl.DataFrame:
-        """Return the IDs dataframe."""
+        """Return the IDs dataframe.
+        Examples:
+            >>> anno = pl.DataFrame(
+                    {
+                        "series": ["GSE1", "GSE1", "GSE2"],
+                        "sample": ["GSM1", "GSM2", "GSM3"],
+                        "UBERON:0000948": [1, 0, 0],
+                        "UBERON:0002349": [1, 1, 0],
+                        "UBERON:0002113": [0, 0, 0],
+                        "UBERON:0000955": [0, 0, 1],
+                    }
+                )
+            >>> anno = Annotations.from_df(anno, index_col="sample", group_cols=["series"])
+            >>> anno.ids
+            ┌────────┬────────┐
+            │ sample ┆ series │
+            │ ---    ┆ ---    │
+            │ str    ┆ str    │
+            ╞════════╪════════╡
+            │ GSM1   ┆ GSE1   │
+            │ GSM2   ┆ GSE1   │
+            │ GSM3   ┆ GSE2   │
+            └────────┴────────┘
+        """
         return self._ids.data
     @property
-    def index(self) -> list:
-        """Return the index column as a list."""
+    def index(self) -> list[str]:
+        """Return the index column as a list.
+        Examples:
+            >>> anno = pl.DataFrame(
+                    {
+                        "series": ["GSE1", "GSE1", "GSE2"],
+                        "sample": ["GSM1", "GSM2", "GSM3"],
+                        "UBERON:0000948": [1, 0, 0],
+                        "UBERON:0002349": [1, 1, 0],
+                        "UBERON:0002113": [0, 0, 0],
+                        "UBERON:0000955": [0, 0, 1],
+                    }
+                )
+            >>> anno = Annotations.from_df(anno, index_col="sample", group_cols=["series"])
+            >>> anno.index
+            ['GSM1', 'GSM2', 'GSM3']
+        """
         return self._ids.index.to_list()
     @property
     def n_indices(self) -> int:
-        """Returns number of indices."""
+        """Returns number of indices.
+        Examples:
+            >>> anno = pl.DataFrame(
+                    {
+                        "series": ["GSE1", "GSE1", "GSE2"],
+                        "sample": ["GSM1", "GSM2", "GSM3"],
+                        "UBERON:0000948": [1, 0, 0],
+                        "UBERON:0002349": [1, 1, 0],
+                        "UBERON:0002113": [0, 0, 0],
+                        "UBERON:0000955": [0, 0, 1],
+                    }
+                )
+            >>> anno = Annotations.from_df(anno, index_col="sample", group_cols=["series"])
+            >>> anno.n_indices
+            3
+        """
         return self.data.height
     @property
     def n_entities(self) -> int:
-        """Returns number of entities."""
+        """Returns number of entities.
+        Examples:
+            >>> anno = pl.DataFrame(
+                    {
+                        "series": ["GSE1", "GSE1", "GSE2"],
+                        "sample": ["GSM1", "GSM2", "GSM3"],
+                        "UBERON:0000948": [1, 0, 0],
+                        "UBERON:0002349": [1, 1, 0],
+                        "UBERON:0002113": [0, 0, 0],
+                        "UBERON:0000955": [0, 0, 1],
+                    }
+                )
+            >>> anno = Annotations.from_df(anno, index_col="sample", group_cols=["series"])
+            >>> anno.n_entities
+            4
+        """
         return len(self.entities)
     @property
     def unique_groups(self) -> list[str]:
-        """Returns unique groups."""
+        """Returns unique groups.
+        Examples:
+            >>> anno = pl.DataFrame(
+                    {
+                        "series": ["GSE1", "GSE1", "GSE2"],
+                        "sample": ["GSM1", "GSM2", "GSM3"],
+                        "UBERON:0000948": [1, 0, 0],
+                        "UBERON:0002349": [1, 1, 0],
+                        "UBERON:0002113": [0, 0, 0],
+                        "UBERON:0000955": [0, 0, 1],
+                    }
+                )
+            >>> anno = Annotations.from_df(anno, index_col="sample", group_cols=["series"])
+            >>> anno.unique_groups
+            ['GSE2', 'GSE1']
+        """
         return list(set(self.groups))
     def __repr__(self):

metahq-core 0.1.2__py3-none-any.whl → 1.0.0rc1__py3-none-any.whl

metahq-core 0.1.2__py3-none-any.whl → 1.0.0rc1__py3-none-any.whl