PyPI - pyobo - Versions diffs - 0.11.2__py3-none-any.whl → 0.12.0__py3-none-any.whl - Mend

pyobo 0.11.2__py3-none-any.whl → 0.12.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (227) hide show

pyobo/.DS_Store +0 -0
pyobo/__init__.py +95 -20
pyobo/__main__.py +0 -0
pyobo/api/__init__.py +81 -10
pyobo/api/alts.py +52 -42
pyobo/api/combine.py +39 -0
pyobo/api/edges.py +68 -0
pyobo/api/hierarchy.py +231 -203
pyobo/api/metadata.py +14 -19
pyobo/api/names.py +207 -127
pyobo/api/properties.py +117 -113
pyobo/api/relations.py +68 -94
pyobo/api/species.py +24 -21
pyobo/api/typedefs.py +11 -11
pyobo/api/utils.py +66 -13
pyobo/api/xrefs.py +108 -114
pyobo/cli/__init__.py +0 -0
pyobo/cli/cli.py +35 -50
pyobo/cli/database.py +183 -161
pyobo/{xrefdb/xrefs_pipeline.py → cli/database_utils.py} +54 -73
pyobo/cli/lookup.py +163 -195
pyobo/cli/utils.py +19 -6
pyobo/constants.py +102 -3
pyobo/getters.py +196 -118
pyobo/gilda_utils.py +79 -200
pyobo/identifier_utils/__init__.py +41 -0
pyobo/identifier_utils/api.py +296 -0
pyobo/identifier_utils/model.py +130 -0
pyobo/identifier_utils/preprocessing.json +812 -0
pyobo/identifier_utils/preprocessing.py +61 -0
pyobo/identifier_utils/relations/__init__.py +8 -0
pyobo/identifier_utils/relations/api.py +162 -0
pyobo/identifier_utils/relations/data.json +5824 -0
pyobo/identifier_utils/relations/data_owl.json +57 -0
pyobo/identifier_utils/relations/data_rdf.json +1 -0
pyobo/identifier_utils/relations/data_rdfs.json +7 -0
pyobo/mocks.py +9 -6
pyobo/ner/__init__.py +9 -0
pyobo/ner/api.py +72 -0
pyobo/ner/normalizer.py +33 -0
pyobo/obographs.py +43 -39
pyobo/plugins.py +5 -4
pyobo/py.typed +0 -0
pyobo/reader.py +1358 -395
pyobo/reader_utils.py +155 -0
pyobo/resource_utils.py +42 -22
pyobo/resources/__init__.py +0 -0
pyobo/resources/goc.py +75 -0
pyobo/resources/goc.tsv +188 -0
pyobo/resources/ncbitaxon.py +4 -5
pyobo/resources/ncbitaxon.tsv.gz +0 -0
pyobo/resources/ro.py +3 -2
pyobo/resources/ro.tsv +0 -0
pyobo/resources/so.py +0 -0
pyobo/resources/so.tsv +0 -0
pyobo/sources/README.md +12 -8
pyobo/sources/__init__.py +52 -29
pyobo/sources/agrovoc.py +0 -0
pyobo/sources/antibodyregistry.py +11 -12
pyobo/sources/bigg/__init__.py +13 -0
pyobo/sources/bigg/bigg_compartment.py +81 -0
pyobo/sources/bigg/bigg_metabolite.py +229 -0
pyobo/sources/bigg/bigg_model.py +46 -0
pyobo/sources/bigg/bigg_reaction.py +77 -0
pyobo/sources/biogrid.py +1 -2
pyobo/sources/ccle.py +7 -12
pyobo/sources/cgnc.py +0 -5
pyobo/sources/chebi.py +1 -1
pyobo/sources/chembl/__init__.py +9 -0
pyobo/sources/{chembl.py → chembl/chembl_compound.py} +13 -25
pyobo/sources/chembl/chembl_target.py +160 -0
pyobo/sources/civic_gene.py +55 -15
pyobo/sources/clinicaltrials.py +160 -0
pyobo/sources/complexportal.py +24 -24
pyobo/sources/conso.py +14 -22
pyobo/sources/cpt.py +0 -0
pyobo/sources/credit.py +1 -9
pyobo/sources/cvx.py +27 -5
pyobo/sources/depmap.py +9 -12
pyobo/sources/dictybase_gene.py +2 -7
pyobo/sources/drugbank/__init__.py +9 -0
pyobo/sources/{drugbank.py → drugbank/drugbank.py} +11 -16
pyobo/sources/{drugbank_salt.py → drugbank/drugbank_salt.py} +3 -8
pyobo/sources/drugcentral.py +17 -13
pyobo/sources/expasy.py +31 -34
pyobo/sources/famplex.py +13 -18
pyobo/sources/flybase.py +3 -8
pyobo/sources/gard.py +62 -0
pyobo/sources/geonames/__init__.py +9 -0
pyobo/sources/geonames/features.py +28 -0
pyobo/sources/{geonames.py → geonames/geonames.py} +87 -26
pyobo/sources/geonames/utils.py +115 -0
pyobo/sources/gmt_utils.py +6 -7
pyobo/sources/go.py +20 -13
pyobo/sources/gtdb.py +154 -0
pyobo/sources/gwascentral/__init__.py +9 -0
pyobo/sources/{gwascentral_phenotype.py → gwascentral/gwascentral_phenotype.py} +5 -7
pyobo/sources/{gwascentral_study.py → gwascentral/gwascentral_study.py} +1 -7
pyobo/sources/hgnc/__init__.py +9 -0
pyobo/sources/{hgnc.py → hgnc/hgnc.py} +56 -70
pyobo/sources/{hgncgenefamily.py → hgnc/hgncgenefamily.py} +8 -18
pyobo/sources/icd/__init__.py +9 -0
pyobo/sources/{icd10.py → icd/icd10.py} +35 -37
pyobo/sources/icd/icd11.py +148 -0
pyobo/sources/{icd_utils.py → icd/icd_utils.py} +66 -20
pyobo/sources/interpro.py +4 -9
pyobo/sources/itis.py +0 -5
pyobo/sources/kegg/__init__.py +0 -0
pyobo/sources/kegg/api.py +16 -38
pyobo/sources/kegg/genes.py +9 -20
pyobo/sources/kegg/genome.py +1 -7
pyobo/sources/kegg/pathway.py +9 -21
pyobo/sources/mesh.py +58 -24
pyobo/sources/mgi.py +3 -10
pyobo/sources/mirbase/__init__.py +11 -0
pyobo/sources/{mirbase.py → mirbase/mirbase.py} +8 -11
pyobo/sources/{mirbase_constants.py → mirbase/mirbase_constants.py} +0 -0
pyobo/sources/{mirbase_family.py → mirbase/mirbase_family.py} +4 -8
pyobo/sources/{mirbase_mature.py → mirbase/mirbase_mature.py} +3 -7
pyobo/sources/msigdb.py +74 -39
pyobo/sources/ncbi/__init__.py +9 -0
pyobo/sources/ncbi/ncbi_gc.py +162 -0
pyobo/sources/{ncbigene.py → ncbi/ncbigene.py} +18 -19
pyobo/sources/nih_reporter.py +60 -0
pyobo/sources/nlm/__init__.py +9 -0
pyobo/sources/nlm/nlm_catalog.py +48 -0
pyobo/sources/nlm/nlm_publisher.py +36 -0
pyobo/sources/nlm/utils.py +116 -0
pyobo/sources/npass.py +6 -8
pyobo/sources/omim_ps.py +10 -3
pyobo/sources/pathbank.py +4 -8
pyobo/sources/pfam/__init__.py +9 -0
pyobo/sources/{pfam.py → pfam/pfam.py} +3 -8
pyobo/sources/{pfam_clan.py → pfam/pfam_clan.py} +2 -7
pyobo/sources/pharmgkb/__init__.py +15 -0
pyobo/sources/pharmgkb/pharmgkb_chemical.py +89 -0
pyobo/sources/pharmgkb/pharmgkb_disease.py +77 -0
pyobo/sources/pharmgkb/pharmgkb_gene.py +108 -0
pyobo/sources/pharmgkb/pharmgkb_pathway.py +63 -0
pyobo/sources/pharmgkb/pharmgkb_variant.py +84 -0
pyobo/sources/pharmgkb/utils.py +86 -0
pyobo/sources/pid.py +1 -6
pyobo/sources/pombase.py +6 -10
pyobo/sources/pubchem.py +4 -9
pyobo/sources/reactome.py +5 -11
pyobo/sources/rgd.py +11 -16
pyobo/sources/rhea.py +37 -36
pyobo/sources/ror.py +69 -42
pyobo/sources/selventa/__init__.py +0 -0
pyobo/sources/selventa/schem.py +4 -7
pyobo/sources/selventa/scomp.py +1 -6
pyobo/sources/selventa/sdis.py +4 -7
pyobo/sources/selventa/sfam.py +1 -6
pyobo/sources/sgd.py +6 -11
pyobo/sources/signor/__init__.py +7 -0
pyobo/sources/signor/download.py +41 -0
pyobo/sources/signor/signor_complexes.py +105 -0
pyobo/sources/slm.py +12 -15
pyobo/sources/umls/__init__.py +7 -1
pyobo/sources/umls/__main__.py +0 -0
pyobo/sources/umls/get_synonym_types.py +20 -4
pyobo/sources/umls/sty.py +57 -0
pyobo/sources/umls/synonym_types.tsv +1 -1
pyobo/sources/umls/umls.py +18 -22
pyobo/sources/unimod.py +46 -0
pyobo/sources/uniprot/__init__.py +1 -1
pyobo/sources/uniprot/uniprot.py +40 -32
pyobo/sources/uniprot/uniprot_ptm.py +4 -34
pyobo/sources/utils.py +3 -2
pyobo/sources/wikipathways.py +7 -10
pyobo/sources/zfin.py +5 -10
pyobo/ssg/__init__.py +12 -16
pyobo/ssg/base.html +0 -0
pyobo/ssg/index.html +26 -13
pyobo/ssg/term.html +12 -2
pyobo/ssg/typedef.html +0 -0
pyobo/struct/__init__.py +54 -8
pyobo/struct/functional/__init__.py +1 -0
pyobo/struct/functional/dsl.py +2572 -0
pyobo/struct/functional/macros.py +423 -0
pyobo/struct/functional/obo_to_functional.py +385 -0
pyobo/struct/functional/ontology.py +270 -0
pyobo/struct/functional/utils.py +112 -0
pyobo/struct/reference.py +331 -136
pyobo/struct/struct.py +1413 -643
pyobo/struct/struct_utils.py +1078 -0
pyobo/struct/typedef.py +162 -210
pyobo/struct/utils.py +12 -5
pyobo/struct/vocabulary.py +138 -0
pyobo/utils/__init__.py +0 -0
pyobo/utils/cache.py +13 -11
pyobo/utils/io.py +17 -31
pyobo/utils/iter.py +5 -5
pyobo/utils/misc.py +41 -53
pyobo/utils/ndex_utils.py +0 -0
pyobo/utils/path.py +76 -70
pyobo/version.py +3 -3
{pyobo-0.11.2.dist-info → pyobo-0.12.0.dist-info}/METADATA +228 -229
pyobo-0.12.0.dist-info/RECORD +202 -0
pyobo-0.12.0.dist-info/WHEEL +4 -0
{pyobo-0.11.2.dist-info → pyobo-0.12.0.dist-info}/entry_points.txt +1 -0
pyobo-0.12.0.dist-info/licenses/LICENSE +21 -0
pyobo/aws.py +0 -162
pyobo/cli/aws.py +0 -47
pyobo/identifier_utils.py +0 -142
pyobo/normalizer.py +0 -232
pyobo/registries/__init__.py +0 -16
pyobo/registries/metaregistry.json +0 -507
pyobo/registries/metaregistry.py +0 -135
pyobo/sources/icd11.py +0 -105
pyobo/xrefdb/__init__.py +0 -1
pyobo/xrefdb/canonicalizer.py +0 -214
pyobo/xrefdb/priority.py +0 -59
pyobo/xrefdb/sources/__init__.py +0 -60
pyobo/xrefdb/sources/biomappings.py +0 -36
pyobo/xrefdb/sources/cbms2019.py +0 -91
pyobo/xrefdb/sources/chembl.py +0 -83
pyobo/xrefdb/sources/compath.py +0 -82
pyobo/xrefdb/sources/famplex.py +0 -64
pyobo/xrefdb/sources/gilda.py +0 -50
pyobo/xrefdb/sources/intact.py +0 -113
pyobo/xrefdb/sources/ncit.py +0 -133
pyobo/xrefdb/sources/pubchem.py +0 -27
pyobo/xrefdb/sources/wikidata.py +0 -116
pyobo-0.11.2.dist-info/RECORD +0 -157
pyobo-0.11.2.dist-info/WHEEL +0 -5
pyobo-0.11.2.dist-info/top_level.txt +0 -1

pyobo/api/hierarchy.py CHANGED Viewed

@@ -1,291 +1,319 @@
 """High-level API for hierarchies."""
 import logging
+import warnings
 from collections.abc import Iterable
 from functools import lru_cache
-from typing import Optional
+from typing import overload
 import networkx as nx
-from .names import get_name
-from .properties import get_filtered_properties_mapping
-from .relations import get_filtered_relations_df
-from ..identifier_utils import wrap_norm_prefix
-from ..struct import TypeDef, has_member, is_a, part_of
+from curies import ReferenceTuple
+from typing_extensions import NotRequired, Unpack
+from .edges import get_edges
+from .names import get_name, get_references
+from .properties import get_literal_properties
+from .utils import _get_pi
+from ..constants import GetOntologyKwargs
+from ..struct import has_member, has_part, is_a, member_of, part_of
 from ..struct.reference import Reference
+from ..struct.struct_utils import ReferenceHint, _ensure_ref
 __all__ = [
+    "get_ancestors",
+    "get_children",
+    "get_descendants",
     "get_hierarchy",
     "get_subhierarchy",
-    "get_descendants",
-    "get_ancestors",
     "has_ancestor",
     "is_descendent",
-    "get_children",
 ]
 logger = logging.getLogger(__name__)
+class HierarchyKwargs(GetOntologyKwargs):
+    """Keyword argument hints for hierarchy getter functions."""
+    include_part_of: NotRequired[bool]
+    include_has_member: NotRequired[bool]
 def get_hierarchy(
     prefix: str,
     *,
-    include_part_of: bool = True,
-    include_has_member: bool = False,
-    extra_relations: Optional[Iterable[TypeDef]] = None,
-    properties: Optional[Iterable[str]] = None,
-    use_tqdm: bool = False,
-    force: bool = False,
-    version: Optional[str] = None,
+    extra_relations: Iterable[ReferenceHint] | None = None,
+    properties: Iterable[ReferenceHint] | None = None,
+    **kwargs: Unpack[HierarchyKwargs],
 ) -> nx.DiGraph:
     """Get hierarchy of parents as a directed graph.
     :param prefix: The name of the namespace.
-    :param include_part_of: Add "part of" relations. Only works if the relations are properly
-        defined using bfo:0000050 ! part of or bfo:0000051 ! has part
-    :param include_has_member: Add "has member" relations. These aren't part of the BFO, but
-        are hacked into PyOBO using :data:`pyobo.struct.typedef.has_member` for relationships like
-        from protein families to their actual proteins.
-    :param extra_relations: Other relations that you want to include in the hierarchy. For
-        example, it might be useful to include the positively_regulates
-    :param properties: Properties to include in the data part of each node. For example, might want
-        to include SMILES strings with the ChEBI tree.
-    :param use_tqdm: Show a progress bar
+    :param include_part_of: Add "part of" relations. Only works if the relations are
+        properly defined using bfo:0000050 ! part of or bfo:0000051 ! has part
+    :param include_has_member: Add "has member" relations. These aren't part of the BFO,
+        but are hacked into PyOBO using :data:`pyobo.struct.typedef.has_member` for
+        relationships like from protein families to their actual proteins.
+    :param extra_relations: Other relations that you want to include in the hierarchy.
+        For example, it might be useful to include the positively_regulates
+    :param properties: Properties to include in the data part of each node. For example,
+        might want to include SMILES strings with the ChEBI tree.
     :param force: should the resources be reloaded when extracting relations?
     :returns: A directional graph representing the hierarchy
-    This function thinly wraps :func:`_get_hierarchy_helper` to make it easier to work with the lru_cache mechanism.
+    This function thinly wraps :func:`_get_hierarchy_helper` to make it easier to work
+    with the lru_cache mechanism.
     """
     return _get_hierarchy_helper(
         prefix=prefix,
-        include_part_of=include_part_of,
-        include_has_member=include_has_member,
-        extra_relations=tuple(sorted(extra_relations or [], key=lambda t: t.curie)),
-        properties=tuple(sorted(properties or [])),
-        use_tqdm=use_tqdm,
-        force=force,
-        version=version,
+        extra_relations=_tp(prefix, extra_relations),
+        properties=_tp(prefix, properties),
+        **kwargs,
+    )
+def _tp(prefix: str, references: Iterable[ReferenceHint] | None) -> tuple[Reference, ...]:
+    return tuple(
+        sorted(_ensure_ref(reference, ontology_prefix=prefix) for reference in references or [])
     )
 @lru_cache
-@wrap_norm_prefix
 def _get_hierarchy_helper(
     prefix: str,
     *,
-    extra_relations: tuple[TypeDef, ...],
-    properties: tuple[str, ...],
-    include_part_of: bool,
-    include_has_member: bool,
-    use_tqdm: bool,
-    force: bool = False,
-    version: Optional[str] = None,
+    extra_relations: tuple[Reference, ...],
+    properties: tuple[Reference, ...],
+    include_part_of: bool = False,
+    include_has_member: bool = False,
+    **kwargs: Unpack[GetOntologyKwargs],
 ) -> nx.DiGraph:
+    predicates, reverse_predicates = _get_predicate_sets(
+        extra_relations, include_part_of, include_has_member
+    )
     rv = nx.DiGraph()
+    rv.add_nodes_from(get_references(prefix, **kwargs))
-    is_a_df = get_filtered_relations_df(
-        prefix=prefix,
-        relation=is_a,
-        use_tqdm=use_tqdm,
-        force=force,
-        version=version,
-    )
-    for source_id, target_ns, target_id in is_a_df.values:
-        rv.add_edge(f"{prefix}:{source_id}", f"{target_ns}:{target_id}", relation="is_a")
+    for s, p, o in get_edges(prefix, **kwargs):
+        if p in predicates:
+            rv.add_edge(s, o, relation=p)
+        elif p in reverse_predicates:
+            rv.add_edge(o, s, relation=p)
-    if include_has_member:
-        has_member_df = get_filtered_relations_df(
-            prefix=prefix,
-            relation=has_member,
-            use_tqdm=use_tqdm,
-            force=force,
-            version=version,
-        )
-        for target_id, source_ns, source_id in has_member_df.values:
-            rv.add_edge(f"{source_ns}:{source_id}", f"{prefix}:{target_id}", relation="is_a")
+    properties_ = set(properties)
+    for s, p, op in get_literal_properties(prefix, **kwargs):
+        if s in rv and p in properties_:
+            rv.nodes[s][p] = op.value
+    return rv
+def _get_predicate_sets(
+    extra_relations: Iterable[Reference], include_part_of: bool, include_has_member: bool
+) -> tuple[set[Reference], set[Reference]]:
+    predicates: set[Reference] = {is_a.reference, *extra_relations}
+    reverse_predicates: set[Reference] = set()
     if include_part_of:
-        part_of_df = get_filtered_relations_df(
-            prefix=prefix,
-            relation=part_of,
-            use_tqdm=use_tqdm,
-            force=force,
-            version=version,
-        )
-        for source_id, target_ns, target_id in part_of_df.values:
-            rv.add_edge(f"{prefix}:{source_id}", f"{target_ns}:{target_id}", relation="part_of")
-        has_part_df = get_filtered_relations_df(
-            prefix=prefix,
-            relation=part_of,
-            use_tqdm=use_tqdm,
-            force=force,
-            version=version,
-        )
-        for target_id, source_ns, source_id in has_part_df.values:
-            rv.add_edge(f"{source_ns}:{source_id}", f"{prefix}:{target_id}", relation="part_of")
-    for relation in extra_relations:
-        if not isinstance(relation, (TypeDef, Reference)):
-            raise TypeError
-        relation_df = get_filtered_relations_df(
-            prefix=prefix,
-            relation=relation,
-            use_tqdm=use_tqdm,
-            force=force,
-            version=version,
-        )
-        for source_id, target_ns, target_id in relation_df.values:
-            rv.add_edge(
-                f"{prefix}:{source_id}", f"{target_ns}:{target_id}", relation=relation.identifier
-            )
-    for prop in properties:
-        props = get_filtered_properties_mapping(
-            prefix=prefix, prop=prop, use_tqdm=use_tqdm, force=force
-        )
-        for identifier, value in props.items():
-            curie = f"{prefix}:{identifier}"
-            if curie in rv:
-                rv.nodes[curie][prop] = value
+        predicates.add(part_of.reference)
+        reverse_predicates.add(has_part.reference)
+    if include_has_member:
+        predicates.add(has_member.reference)
+        reverse_predicates.add(member_of.reference)
+    return predicates, reverse_predicates
-    return rv
+# docstr-coverage:excused `overload`
+@overload
+def is_descendent(
+    prefix: str,
+    identifier: str,
+    ancestor_prefix: str = ...,
+    ancestor_identifier: str = ...,
+    /,
+    **kwargs: Unpack[HierarchyKwargs],
+) -> bool: ...
+# docstr-coverage:excused `overload`
+@overload
 def is_descendent(
-    prefix, identifier, ancestor_prefix, ancestor_identifier, *, version: Optional[str] = None
+    descendant: Reference,
+    ancestor: Reference,
+    _1: None = ...,
+    _2: None = ...,
+    /,
+    **kwargs: Unpack[HierarchyKwargs],
+) -> bool: ...
+def is_descendent(
+    prefix: str | Reference,
+    identifier: str | Reference,
+    ancestor_prefix: str | None = None,
+    ancestor_identifier: str | None = None,
+    /,
+    **kwargs: Unpack[HierarchyKwargs],
 ) -> bool:
     """Check that the first identifier has the second as a descendent.
-    Check that go:0070246 ! natural killer cell apoptotic process is a
-    descendant of go:0006915 ! apoptotic process::
+    :param prefix: The prefix for the descendant
+    :param identifier: The local unique identifier for the descendant
+    :param ancestor_prefix: The prefix for the ancestor
+    :param ancestor_identifier: The local unique identifier for the ancestor
+    :param kwargs: Keyword arguments for :func:`get_hierarchy`
+    :return: If the decendant has the given ancestor
+    Check that ``GO:0070246`` (natural killer cell apoptotic process) is a descendant of
+    ``GO:0006915`` (apoptotic process)
+    >>> nk_apoptosis = Reference.from_curie(
+    ...     "GO:0070246", name="natural killer cell apoptotic process"
+    ... )
+    >>> apoptosis = Reference.from_curie("GO:0006915", name="apoptotic process")
+    >>> assert is_descendent(nk_apoptosis, apoptosis)
+    Using deprecated old-style arguments:
     >>> assert is_descendent("go", "0070246", "go", "0006915")
     """
-    descendants = get_descendants(ancestor_prefix, ancestor_identifier, version=version)
-    return descendants is not None and f"{prefix}:{identifier}" in descendants
+    descendant, ancestor = _get_double_reference(
+        prefix, identifier, ancestor_prefix, ancestor_identifier
+    )
+    descendants = get_descendants(ancestor, **kwargs)
+    return descendants is not None and descendant in descendants
 @lru_cache
 def get_descendants(
-    prefix: str,
-    identifier: Optional[str] = None,
-    include_part_of: bool = True,
-    include_has_member: bool = False,
-    use_tqdm: bool = False,
-    force: bool = False,
-    **kwargs,
-) -> Optional[set[str]]:
+    prefix: str | Reference | ReferenceTuple,
+    identifier: str | None = None,
+    /,
+    **kwargs: Unpack[HierarchyKwargs],
+) -> set[Reference] | None:
     """Get all the descendants (children) of the term as CURIEs."""
-    curie, prefix, identifier = _pic(prefix, identifier)
-    hierarchy = get_hierarchy(
-        prefix=prefix,
-        include_has_member=include_has_member,
-        include_part_of=include_part_of,
-        use_tqdm=use_tqdm,
-        force=force,
-        **kwargs,
-    )
-    if curie not in hierarchy:
+    t = _get_pi(prefix, identifier)
+    hierarchy = get_hierarchy(prefix=t.prefix, **kwargs)
+    if t not in hierarchy:
         return None
-    return nx.ancestors(hierarchy, curie)  # note this is backwards
-def _pic(prefix, identifier=None) -> tuple[str, str, str]:
-    if identifier is None:
-        curie = prefix
-        prefix, identifier = prefix.split(":")
-    else:
-        curie = f"{prefix}:{identifier}"
-    return curie, prefix, identifier
+    return nx.ancestors(hierarchy, t)  # note this is backwards
 @lru_cache
 def get_children(
-    prefix: str,
-    identifier: Optional[str] = None,
-    include_part_of: bool = True,
-    include_has_member: bool = False,
-    use_tqdm: bool = False,
-    force: bool = False,
-    **kwargs,
-) -> Optional[set[str]]:
+    prefix: str | Reference | ReferenceTuple,
+    identifier: str | None = None,
+    /,
+    **kwargs: Unpack[HierarchyKwargs],
+) -> set[Reference] | None:
     """Get all the descendants (children) of the term as CURIEs."""
-    curie, prefix, identifier = _pic(prefix, identifier)
-    hierarchy = get_hierarchy(
-        prefix=prefix,
-        include_has_member=include_has_member,
-        include_part_of=include_part_of,
-        use_tqdm=use_tqdm,
-        force=force,
-        **kwargs,
-    )
-    if curie not in hierarchy:
+    t = _get_pi(prefix, identifier)
+    hierarchy = get_hierarchy(prefix=t.prefix, **kwargs)
+    if t not in hierarchy:
         return None
-    return set(hierarchy.predecessors(curie))
+    return set(hierarchy.predecessors(t))
+# docstr-coverage:excused `overload`
+@overload
+def has_ancestor(
+    prefix: str,
+    identifier: str,
+    ancestor_prefix: str = ...,
+    ancestor_identifier: str = ...,
+    /,
+    **kwargs: Unpack[HierarchyKwargs],
+) -> bool: ...
+# docstr-coverage:excused `overload`
+@overload
+def has_ancestor(
+    descendant: Reference,
+    ancestor: Reference,
+    _1: None = ...,
+    _2: None = ...,
+    /,
+    **kwargs: Unpack[HierarchyKwargs],
+) -> bool: ...
 def has_ancestor(
-    prefix, identifier, ancestor_prefix, ancestor_identifier, *, version: Optional[str] = None
+    prefix: str | Reference,
+    identifier: str | Reference,
+    ancestor_prefix: str | None = None,
+    ancestor_identifier: str | None = None,
+    /,
+    **kwargs: Unpack[HierarchyKwargs],
 ) -> bool:
     """Check that the first identifier has the second as an ancestor.
-    Check that go:0008219 ! cell death is an ancestor of go:0006915 ! apoptotic process::
+    :param prefix: The prefix for the descendant
+    :param identifier: The local unique identifier for the descendant
+    :param ancestor_prefix: The prefix for the ancestor
+    :param ancestor_identifier: The local unique identifier for the ancestor
+    :param kwargs: Keyword arguments for :func:`get_hierarchy`
+    :return: If the decendant has the given ancestor
+    Check that ``GO:0008219`` (cell death) is an ancestor of ``GO:0006915``
+    (apoptotic process):
+    >>> apoptosis = Reference.from_curie("GO:0006915", name="apoptotic process")
+    >>> cell_death = Reference.from_curie("GO:0008219", name="cell death")
+    >>> assert has_ancestor(apoptosis, cell_death)
+    The same, using the deprecated argumentation style:
     >>> assert has_ancestor("go", "0006915", "go", "0008219")
     """
-    ancestors = get_ancestors(prefix, identifier, version=version)
-    return ancestors is not None and f"{ancestor_prefix}:{ancestor_identifier}" in ancestors
+    descendant, ancestor = _get_double_reference(
+        prefix, identifier, ancestor_prefix, ancestor_identifier
+    )
+    ancestors = get_ancestors(descendant, **kwargs)
+    return ancestors is not None and ancestor in ancestors
+def _get_double_reference(
+    a: str | Reference, b: str | Reference, c: str | None, d: str | None
+) -> tuple[Reference, Reference]:
+    if isinstance(a, Reference) and isinstance(b, Reference):
+        return a, b
+    elif all(isinstance(x, str) for x in (a, b, c, d)):
+        warnings.warn("passing strings is deprecated", DeprecationWarning, stacklevel=2)
+        return Reference(prefix=a, identifier=b), Reference(prefix=c, identifier=d)
+    else:
+        raise TypeError
 @lru_cache
 def get_ancestors(
-    prefix: str,
-    identifier: Optional[str] = None,
-    include_part_of: bool = True,
-    include_has_member: bool = False,
-    use_tqdm: bool = False,
-    force: bool = False,
-    **kwargs,
-) -> Optional[set[str]]:
+    prefix: str | Reference | ReferenceTuple,
+    identifier: str | None = None,
+    /,
+    **kwargs: Unpack[HierarchyKwargs],
+) -> set[Reference] | None:
     """Get all the ancestors (parents) of the term as CURIEs."""
-    curie, prefix, identifier = _pic(prefix, identifier)
-    hierarchy = get_hierarchy(
-        prefix=prefix,
-        include_has_member=include_has_member,
-        include_part_of=include_part_of,
-        use_tqdm=use_tqdm,
-        force=force,
-        **kwargs,
-    )
-    if curie not in hierarchy:
+    t = _get_pi(prefix, identifier)
+    hierarchy = get_hierarchy(prefix=t.prefix, **kwargs)
+    if t not in hierarchy:
         return None
-    return nx.descendants(hierarchy, curie)  # note this is backwards
+    return nx.descendants(hierarchy, t)  # note this is backwards
 def get_subhierarchy(
-    prefix: str,
-    identifier: Optional[str] = None,
-    include_part_of: bool = True,
-    include_has_member: bool = False,
-    use_tqdm: bool = False,
-    force: bool = False,
-    **kwargs,
+    prefix: str | Reference | ReferenceTuple,
+    identifier: str | None = None,
+    /,
+    **kwargs: Unpack[HierarchyKwargs],
 ) -> nx.DiGraph:
     """Get the subhierarchy for a given node."""
-    curie, prefix, identifier = _pic(prefix, identifier)
-    hierarchy = get_hierarchy(
-        prefix=prefix,
-        include_has_member=include_has_member,
-        include_part_of=include_part_of,
-        use_tqdm=use_tqdm,
-        force=force,
-        **kwargs,
-    )
-    logger.info(
-        "getting descendants of %s:%s ! %s", prefix, identifier, get_name(prefix, identifier)
-    )
-    curies = nx.ancestors(hierarchy, curie)  # note this is backwards
+    t = _get_pi(prefix, identifier)
+    hierarchy = get_hierarchy(prefix=t.prefix, **kwargs)
+    logger.info("getting descendants of %s ! %s", t.curie, get_name(t))
+    descendants = set(nx.ancestors(hierarchy, t)) | {t}  # note this is backwards
     logger.info("inducing subgraph")
-    sg = hierarchy.subgraph(curies).copy()
+    sg = hierarchy.subgraph(descendants).copy()
     logger.info("subgraph has %d nodes/%d edges", sg.number_of_nodes(), sg.number_of_edges())
     return sg

pyobo/api/metadata.py CHANGED Viewed

@@ -1,15 +1,17 @@
 """High-level API for metadata."""
 import logging
-from collections.abc import Mapping
 from functools import lru_cache
-from typing import Optional
+from typing import Any, cast
-from .utils import get_version
+from typing_extensions import Unpack
+from .utils import get_version_from_kwargs
+from ..constants import GetOntologyKwargs, check_should_force
 from ..getters import get_ontology
 from ..identifier_utils import wrap_norm_prefix
 from ..utils.cache import cached_json
-from ..utils.path import prefix_cache_join
+from ..utils.path import CacheArtifact, get_cache_path
 __all__ = [
     "get_metadata",
@@ -20,21 +22,14 @@ logger = logging.getLogger(__name__)
 @lru_cache
 @wrap_norm_prefix
-def get_metadata(
-    prefix: str, *, force: bool = False, version: Optional[str] = None
-) -> Mapping[str, str]:
+def get_metadata(prefix: str, **kwargs: Unpack[GetOntologyKwargs]) -> dict[str, Any]:
     """Get metadata for the ontology."""
-    if version is None:
-        version = get_version(prefix)
-    path = prefix_cache_join(prefix, name="metadata.json", version=version)
-    @cached_json(path=path, force=force)
-    def _get_json() -> Mapping[str, str]:
-        if force:
-            logger.debug("[%s] forcing reload for metadata", prefix)
-        else:
-            logger.debug("[%s] no cached metadata found. getting from OBO loader", prefix)
-        ontology = get_ontology(prefix, force=force, version=version)
+    version = get_version_from_kwargs(prefix, kwargs)
+    path = get_cache_path(prefix, CacheArtifact.metadata, version=version)
+    @cached_json(path=path, force=check_should_force(kwargs))
+    def _get_json() -> dict[str, Any]:
+        ontology = get_ontology(prefix, **kwargs)
         return ontology.get_metadata()
-    return _get_json()
+    return cast(dict[str, Any], _get_json())

pyobo 0.11.2__py3-none-any.whl → 0.12.0__py3-none-any.whl

pyobo 0.11.2__py3-none-any.whl → 0.12.0__py3-none-any.whl