PyPI - pyobo - Versions diffs - 0.11.2__py3-none-any.whl → 0.12.1__py3-none-any.whl - Mend

pyobo 0.11.2__py3-none-any.whl → 0.12.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (228) hide show

pyobo/.DS_Store +0 -0
pyobo/__init__.py +95 -20
pyobo/__main__.py +0 -0
pyobo/api/__init__.py +81 -10
pyobo/api/alts.py +52 -42
pyobo/api/combine.py +39 -0
pyobo/api/edges.py +68 -0
pyobo/api/hierarchy.py +231 -203
pyobo/api/metadata.py +14 -19
pyobo/api/names.py +207 -127
pyobo/api/properties.py +117 -117
pyobo/api/relations.py +68 -94
pyobo/api/species.py +24 -21
pyobo/api/typedefs.py +11 -11
pyobo/api/utils.py +66 -13
pyobo/api/xrefs.py +107 -114
pyobo/cli/__init__.py +0 -0
pyobo/cli/cli.py +35 -50
pyobo/cli/database.py +210 -160
pyobo/cli/database_utils.py +155 -0
pyobo/cli/lookup.py +163 -195
pyobo/cli/utils.py +19 -6
pyobo/constants.py +102 -3
pyobo/getters.py +209 -191
pyobo/gilda_utils.py +52 -250
pyobo/identifier_utils/__init__.py +33 -0
pyobo/identifier_utils/api.py +305 -0
pyobo/identifier_utils/preprocessing.json +873 -0
pyobo/identifier_utils/preprocessing.py +27 -0
pyobo/identifier_utils/relations/__init__.py +8 -0
pyobo/identifier_utils/relations/api.py +162 -0
pyobo/identifier_utils/relations/data.json +5824 -0
pyobo/identifier_utils/relations/data_owl.json +57 -0
pyobo/identifier_utils/relations/data_rdf.json +1 -0
pyobo/identifier_utils/relations/data_rdfs.json +7 -0
pyobo/mocks.py +9 -6
pyobo/ner/__init__.py +9 -0
pyobo/ner/api.py +72 -0
pyobo/ner/normalizer.py +33 -0
pyobo/obographs.py +48 -40
pyobo/plugins.py +5 -4
pyobo/py.typed +0 -0
pyobo/reader.py +1354 -395
pyobo/reader_utils.py +155 -0
pyobo/resource_utils.py +42 -22
pyobo/resources/__init__.py +0 -0
pyobo/resources/goc.py +75 -0
pyobo/resources/goc.tsv +188 -0
pyobo/resources/ncbitaxon.py +4 -5
pyobo/resources/ncbitaxon.tsv.gz +0 -0
pyobo/resources/ro.py +3 -2
pyobo/resources/ro.tsv +0 -0
pyobo/resources/so.py +0 -0
pyobo/resources/so.tsv +0 -0
pyobo/sources/README.md +12 -8
pyobo/sources/__init__.py +52 -29
pyobo/sources/agrovoc.py +0 -0
pyobo/sources/antibodyregistry.py +11 -12
pyobo/sources/bigg/__init__.py +13 -0
pyobo/sources/bigg/bigg_compartment.py +81 -0
pyobo/sources/bigg/bigg_metabolite.py +229 -0
pyobo/sources/bigg/bigg_model.py +46 -0
pyobo/sources/bigg/bigg_reaction.py +77 -0
pyobo/sources/biogrid.py +1 -2
pyobo/sources/ccle.py +7 -12
pyobo/sources/cgnc.py +9 -6
pyobo/sources/chebi.py +1 -1
pyobo/sources/chembl/__init__.py +9 -0
pyobo/sources/{chembl.py → chembl/chembl_compound.py} +13 -25
pyobo/sources/chembl/chembl_target.py +160 -0
pyobo/sources/civic_gene.py +55 -15
pyobo/sources/clinicaltrials.py +160 -0
pyobo/sources/complexportal.py +24 -24
pyobo/sources/conso.py +14 -22
pyobo/sources/cpt.py +0 -0
pyobo/sources/credit.py +1 -9
pyobo/sources/cvx.py +27 -5
pyobo/sources/depmap.py +9 -12
pyobo/sources/dictybase_gene.py +2 -7
pyobo/sources/drugbank/__init__.py +9 -0
pyobo/sources/{drugbank.py → drugbank/drugbank.py} +11 -16
pyobo/sources/{drugbank_salt.py → drugbank/drugbank_salt.py} +3 -8
pyobo/sources/drugcentral.py +17 -13
pyobo/sources/expasy.py +31 -34
pyobo/sources/famplex.py +13 -18
pyobo/sources/flybase.py +8 -13
pyobo/sources/gard.py +62 -0
pyobo/sources/geonames/__init__.py +9 -0
pyobo/sources/geonames/features.py +28 -0
pyobo/sources/{geonames.py → geonames/geonames.py} +87 -26
pyobo/sources/geonames/utils.py +115 -0
pyobo/sources/gmt_utils.py +6 -7
pyobo/sources/go.py +20 -13
pyobo/sources/gtdb.py +154 -0
pyobo/sources/gwascentral/__init__.py +9 -0
pyobo/sources/{gwascentral_phenotype.py → gwascentral/gwascentral_phenotype.py} +5 -7
pyobo/sources/{gwascentral_study.py → gwascentral/gwascentral_study.py} +1 -7
pyobo/sources/hgnc/__init__.py +9 -0
pyobo/sources/{hgnc.py → hgnc/hgnc.py} +56 -70
pyobo/sources/{hgncgenefamily.py → hgnc/hgncgenefamily.py} +8 -18
pyobo/sources/icd/__init__.py +9 -0
pyobo/sources/{icd10.py → icd/icd10.py} +35 -37
pyobo/sources/icd/icd11.py +148 -0
pyobo/sources/{icd_utils.py → icd/icd_utils.py} +66 -20
pyobo/sources/interpro.py +4 -9
pyobo/sources/itis.py +0 -5
pyobo/sources/kegg/__init__.py +0 -0
pyobo/sources/kegg/api.py +16 -38
pyobo/sources/kegg/genes.py +9 -20
pyobo/sources/kegg/genome.py +1 -7
pyobo/sources/kegg/pathway.py +9 -21
pyobo/sources/mesh.py +58 -24
pyobo/sources/mgi.py +3 -10
pyobo/sources/mirbase/__init__.py +11 -0
pyobo/sources/{mirbase.py → mirbase/mirbase.py} +8 -11
pyobo/sources/{mirbase_constants.py → mirbase/mirbase_constants.py} +0 -0
pyobo/sources/{mirbase_family.py → mirbase/mirbase_family.py} +4 -8
pyobo/sources/{mirbase_mature.py → mirbase/mirbase_mature.py} +3 -7
pyobo/sources/msigdb.py +74 -39
pyobo/sources/ncbi/__init__.py +9 -0
pyobo/sources/ncbi/ncbi_gc.py +162 -0
pyobo/sources/{ncbigene.py → ncbi/ncbigene.py} +18 -19
pyobo/sources/nih_reporter.py +60 -0
pyobo/sources/nlm/__init__.py +9 -0
pyobo/sources/nlm/nlm_catalog.py +48 -0
pyobo/sources/nlm/nlm_publisher.py +36 -0
pyobo/sources/nlm/utils.py +116 -0
pyobo/sources/npass.py +6 -8
pyobo/sources/omim_ps.py +11 -4
pyobo/sources/pathbank.py +4 -8
pyobo/sources/pfam/__init__.py +9 -0
pyobo/sources/{pfam.py → pfam/pfam.py} +3 -8
pyobo/sources/{pfam_clan.py → pfam/pfam_clan.py} +2 -7
pyobo/sources/pharmgkb/__init__.py +15 -0
pyobo/sources/pharmgkb/pharmgkb_chemical.py +89 -0
pyobo/sources/pharmgkb/pharmgkb_disease.py +77 -0
pyobo/sources/pharmgkb/pharmgkb_gene.py +108 -0
pyobo/sources/pharmgkb/pharmgkb_pathway.py +63 -0
pyobo/sources/pharmgkb/pharmgkb_variant.py +84 -0
pyobo/sources/pharmgkb/utils.py +86 -0
pyobo/sources/pid.py +1 -6
pyobo/sources/pombase.py +6 -10
pyobo/sources/pubchem.py +4 -9
pyobo/sources/reactome.py +5 -11
pyobo/sources/rgd.py +11 -16
pyobo/sources/rhea.py +37 -36
pyobo/sources/ror.py +69 -42
pyobo/sources/selventa/__init__.py +0 -0
pyobo/sources/selventa/schem.py +4 -7
pyobo/sources/selventa/scomp.py +1 -6
pyobo/sources/selventa/sdis.py +4 -7
pyobo/sources/selventa/sfam.py +1 -6
pyobo/sources/sgd.py +6 -11
pyobo/sources/signor/__init__.py +7 -0
pyobo/sources/signor/download.py +41 -0
pyobo/sources/signor/signor_complexes.py +105 -0
pyobo/sources/slm.py +12 -15
pyobo/sources/umls/__init__.py +7 -1
pyobo/sources/umls/__main__.py +0 -0
pyobo/sources/umls/get_synonym_types.py +20 -4
pyobo/sources/umls/sty.py +57 -0
pyobo/sources/umls/synonym_types.tsv +1 -1
pyobo/sources/umls/umls.py +18 -22
pyobo/sources/unimod.py +46 -0
pyobo/sources/uniprot/__init__.py +1 -1
pyobo/sources/uniprot/uniprot.py +40 -32
pyobo/sources/uniprot/uniprot_ptm.py +4 -34
pyobo/sources/utils.py +3 -2
pyobo/sources/wikipathways.py +7 -10
pyobo/sources/zfin.py +5 -10
pyobo/ssg/__init__.py +12 -16
pyobo/ssg/base.html +0 -0
pyobo/ssg/index.html +26 -13
pyobo/ssg/term.html +12 -2
pyobo/ssg/typedef.html +0 -0
pyobo/struct/__init__.py +54 -8
pyobo/struct/functional/__init__.py +1 -0
pyobo/struct/functional/dsl.py +2572 -0
pyobo/struct/functional/macros.py +423 -0
pyobo/struct/functional/obo_to_functional.py +385 -0
pyobo/struct/functional/ontology.py +272 -0
pyobo/struct/functional/utils.py +112 -0
pyobo/struct/reference.py +331 -136
pyobo/struct/struct.py +1484 -657
pyobo/struct/struct_utils.py +1078 -0
pyobo/struct/typedef.py +162 -210
pyobo/struct/utils.py +12 -5
pyobo/struct/vocabulary.py +138 -0
pyobo/utils/__init__.py +0 -0
pyobo/utils/cache.py +16 -15
pyobo/utils/io.py +51 -41
pyobo/utils/iter.py +5 -5
pyobo/utils/misc.py +41 -53
pyobo/utils/ndex_utils.py +0 -0
pyobo/utils/path.py +73 -70
pyobo/version.py +3 -3
pyobo-0.12.1.dist-info/METADATA +671 -0
pyobo-0.12.1.dist-info/RECORD +201 -0
pyobo-0.12.1.dist-info/WHEEL +4 -0
{pyobo-0.11.2.dist-info → pyobo-0.12.1.dist-info}/entry_points.txt +1 -0
pyobo-0.12.1.dist-info/licenses/LICENSE +21 -0
pyobo/aws.py +0 -162
pyobo/cli/aws.py +0 -47
pyobo/identifier_utils.py +0 -142
pyobo/normalizer.py +0 -232
pyobo/registries/__init__.py +0 -16
pyobo/registries/metaregistry.json +0 -507
pyobo/registries/metaregistry.py +0 -135
pyobo/sources/icd11.py +0 -105
pyobo/xrefdb/__init__.py +0 -1
pyobo/xrefdb/canonicalizer.py +0 -214
pyobo/xrefdb/priority.py +0 -59
pyobo/xrefdb/sources/__init__.py +0 -60
pyobo/xrefdb/sources/biomappings.py +0 -36
pyobo/xrefdb/sources/cbms2019.py +0 -91
pyobo/xrefdb/sources/chembl.py +0 -83
pyobo/xrefdb/sources/compath.py +0 -82
pyobo/xrefdb/sources/famplex.py +0 -64
pyobo/xrefdb/sources/gilda.py +0 -50
pyobo/xrefdb/sources/intact.py +0 -113
pyobo/xrefdb/sources/ncit.py +0 -133
pyobo/xrefdb/sources/pubchem.py +0 -27
pyobo/xrefdb/sources/wikidata.py +0 -116
pyobo/xrefdb/xrefs_pipeline.py +0 -180
pyobo-0.11.2.dist-info/METADATA +0 -711
pyobo-0.11.2.dist-info/RECORD +0 -157
pyobo-0.11.2.dist-info/WHEEL +0 -5
pyobo-0.11.2.dist-info/top_level.txt +0 -1

pyobo/cli/lookup.py CHANGED Viewed

@@ -2,17 +2,20 @@
 import json
 import sys
-from typing import Optional
+from collections.abc import Mapping
 import bioregistry
 import click
 from more_click import verbose_option
+from typing_extensions import Unpack
 from .utils import (
+    Clickable,
     echo_df,
     force_option,
-    no_strict_option,
+    force_process_option,
     prefix_argument,
+    strict_option,
     version_option,
 )
 from ..api import (
@@ -28,15 +31,17 @@ from ..api import (
     get_id_synonyms_mapping,
     get_id_to_alts,
     get_ids,
+    get_mappings_df,
     get_metadata,
     get_name,
-    get_name_by_curie,
     get_properties_df,
     get_relations_df,
     get_typedef_df,
     get_xrefs_df,
 )
-from ..identifier_utils import normalize_curie
+from ..constants import LookupKwargs
+from ..getters import get_ontology
+from ..struct.reference import _parse_str_or_curie_or_uri
 __all__ = [
     "lookup",
@@ -48,150 +53,123 @@ def lookup():
     """Lookup resources."""
-@lookup.command()
-@prefix_argument
+def lookup_annotate(f: Clickable) -> Clickable:
+    """Add appropriate decorators to lookup CLI functions."""
+    for decorator in [
+        lookup.command(),
+        prefix_argument,
+        verbose_option,
+        force_option,
+        force_process_option,
+        strict_option,
+        version_option,
+    ]:
+        f = decorator(f)
+    return f
+identifier_option = click.option("-i", "--identifier")
+@lookup_annotate
 @click.option("-t", "--target")
-@verbose_option
-@force_option
-@no_strict_option
-@version_option
-def xrefs(prefix: str, target: str, force: bool, no_strict: bool, version: Optional[str]):
+def xrefs(target: str, **kwargs: Unpack[LookupKwargs]) -> None:
     """Page through xrefs for the given namespace to the second given namespace."""
     if target:
-        target = bioregistry.normalize_prefix(target)
-        filtered_xrefs = get_filtered_xrefs(
-            prefix, target, force=force, strict=not no_strict, version=version
-        )
+        target_norm = bioregistry.normalize_prefix(target)
+        filtered_xrefs = get_filtered_xrefs(xref_prefix=target_norm, **kwargs)
         click.echo_via_pager(
             "\n".join(f"{identifier}\t{_xref}" for identifier, _xref in filtered_xrefs.items())
         )
     else:
-        all_xrefs_df = get_xrefs_df(prefix, force=force, strict=not no_strict, version=version)
+        all_xrefs_df = get_xrefs_df(**kwargs)
         echo_df(all_xrefs_df)
-@lookup.command()
-@prefix_argument
-@verbose_option
-@force_option
-@version_option
-def metadata(prefix: str, force: bool, version: Optional[str]):
+@lookup_annotate
+@click.option("--include-names", is_flag=True)
+@click.option("-t", "--target")
+def mappings(include_names: bool, target: str | None, **kwargs: Unpack[LookupKwargs]) -> None:
+    """Page through mappings for the given namespace."""
+    mappings_df = get_mappings_df(names=include_names, **kwargs)
+    if target:
+        target_norm = bioregistry.normalize_prefix(target)
+        if target_norm is None:
+            raise ValueError
+        idx = mappings_df["object_id"].map(
+            lambda x: bioregistry.normalize_prefix(x.split(":")[0]) == target_norm
+        )
+        mappings_df = mappings_df[idx]
+    echo_df(mappings_df)
+@lookup_annotate
+def metadata(**kwargs: Unpack[LookupKwargs]) -> None:
     """Print the metadata for the given namespace."""
-    metadata = get_metadata(prefix, force=force, version=version)
+    metadata = get_metadata(**kwargs)
     click.echo(json.dumps(metadata, indent=2))
-@lookup.command()
-@prefix_argument
-@verbose_option
-@force_option
-@no_strict_option
-@version_option
-def ids(prefix: str, force: bool, no_strict: bool, version: Optional[str]):
+@lookup_annotate
+def ids(**kwargs: Unpack[LookupKwargs]) -> None:
     """Page through the identifiers of entities in the given namespace."""
-    id_list = get_ids(prefix, force=force, strict=not no_strict, version=version)
-    click.echo_via_pager("\n".join(id_list))
-@lookup.command()
-@prefix_argument
-@verbose_option
-@force_option
-@no_strict_option
-@click.option("-i", "--identifier")
-@version_option
-def names(
-    prefix: str, identifier: Optional[str], force: bool, no_strict: bool, version: Optional[str]
-):
-    """Page through the identifiers and names of entities in the given namespace."""
-    id_to_name = get_id_name_mapping(prefix, force=force, strict=not no_strict, version=version)
-    if identifier is None:
-        _help_page_mapping(id_to_name)
+    id_list = get_ids(**kwargs)
+    if not id_list:
+        click.secho("no data", fg="red")
     else:
-        name = id_to_name.get(identifier)
-        if name is None:
-            click.secho(f"No name available for {identifier}", fg="red")
-        else:
-            click.echo(name)
-@lookup.command()
-@prefix_argument
-@verbose_option
-@force_option
-@no_strict_option
-@click.option("-i", "--identifier")
-@version_option
-def species(
-    prefix: str, identifier: Optional[str], force: bool, no_strict: bool, version: Optional[str]
-):
+        click.echo_via_pager("\n".join(id_list))
+@lookup_annotate
+@identifier_option
+def names(identifier: str | None, **kwargs: Unpack[LookupKwargs]) -> None:
+    """Page through the identifiers and names of entities in the given namespace."""
+    id_to_name = get_id_name_mapping(**kwargs)
+    _help_page_mapping(id_to_name, identifier=identifier)
+@lookup_annotate
+@identifier_option
+def species(identifier: str | None, **kwargs: Unpack[LookupKwargs]) -> None:
     """Page through the identifiers and species of entities in the given namespace."""
-    id_to_species = get_id_species_mapping(
-        prefix, force=force, strict=not no_strict, version=version
-    )
-    if identifier is None:
-        _help_page_mapping(id_to_species)
-    else:
-        species = id_to_species.get(identifier)
-        if species is None:
-            click.secho(f"No species available for {identifier}", fg="red")
-        else:
-            click.echo(species)
+    id_to_species = get_id_species_mapping(**kwargs)
+    _help_page_mapping(id_to_species, identifier=identifier)
-@lookup.command()
-@prefix_argument
-@verbose_option
-@force_option
-@click.option("-i", "--identifier")
-@version_option
-def definitions(prefix: str, identifier: Optional[str], force: bool, version: Optional[str]):
+@lookup_annotate
+@identifier_option
+def definitions(identifier: str | None, **kwargs: Unpack[LookupKwargs]) -> None:
     """Page through the identifiers and definitions of entities in the given namespace."""
-    id_to_definition = get_id_definition_mapping(prefix, force=force, version=version)
-    if identifier is None:
-        _help_page_mapping(id_to_definition)
-    else:
-        definition = id_to_definition.get(identifier)
-        if definition is None:
-            click.secho(f"No definition available for {identifier}", fg="red")
-        else:
-            click.echo(definition)
+    id_to_definition = get_id_definition_mapping(**kwargs)
+    _help_page_mapping(id_to_definition, identifier=identifier)
-@lookup.command()
-@prefix_argument
-@verbose_option
-@force_option
-@version_option
-def typedefs(prefix: str, force: bool, version: Optional[str]):
+@lookup_annotate
+def typedefs(**kwargs: Unpack[LookupKwargs]) -> None:
     """Page through the identifiers and names of typedefs in the given namespace."""
-    df = get_typedef_df(prefix, force=force, version=version)
+    df = get_typedef_df(**kwargs)
     echo_df(df)
-def _help_page_mapping(id_to_name):
-    click.echo_via_pager("\n".join("\t".join(item) for item in id_to_name.items()))
+def _help_page_mapping(id_to_name: Mapping[str, str], *, identifier: str | None = None) -> None:
+    if not id_to_name:
+        click.secho("no data", fg="red")
+    elif identifier:
+        value = id_to_name.get(identifier)
+        if value:
+            click.echo(value)
+        else:
+            click.secho(f"no data for {identifier}", fg="red")
+    else:
+        click.echo_via_pager("\n".join("\t".join(item) for item in id_to_name.items()))
-@lookup.command()
-@prefix_argument
-@verbose_option
-@force_option
-@version_option
-def synonyms(prefix: str, force: bool, version: Optional[str]):
+@lookup_annotate
+@identifier_option
+def synonyms(identifier: str | None, **kwargs: Unpack[LookupKwargs]) -> None:
     """Page through the synonyms for entities in the given namespace."""
-    if ":" in prefix:
-        _prefix, identifier = normalize_curie(prefix)
-        if _prefix is None or identifier is None:
-            click.secho(f"could not normalize {prefix}")
-            return sys.exit(1)
-        name = get_name(_prefix, identifier)
-        id_to_synonyms = get_id_synonyms_mapping(_prefix, force=force)
-        click.echo(f"Synonyms for {_prefix}:{identifier} ! {name}")
-        for synonym in id_to_synonyms.get(identifier, []):
-            click.echo(synonym)
-    else:  # it's a prefix
-        id_to_synonyms = get_id_synonyms_mapping(prefix, force=force, version=version)
+    id_to_synonyms = get_id_synonyms_mapping(**kwargs)
+    if identifier is None:
         click.echo_via_pager(
             "\n".join(
                 f"{identifier}\t{_synonym}"
@@ -199,136 +177,126 @@ def synonyms(prefix: str, force: bool, version: Optional[str]):
                 for _synonym in _synonyms
             )
         )
+    else:
+        synonyms = id_to_synonyms.get(identifier, [])
+        if not synonyms:
+            click.secho(f"No synonyms available for {identifier}", fg="red")
+        else:
+            click.echo_via_pager("\n".join(synonyms))
-@lookup.command()
-@prefix_argument
+@lookup_annotate
 @click.option(
     "--relation", help="CURIE for the relationship or just the ID if local to the ontology"
 )
 @click.option("--target", help="Prefix for the target")
-@verbose_option
-@no_strict_option
-@force_option
 @click.option("--summarize", is_flag=True)
-@version_option
 def relations(
-    prefix: str,
     relation: str,
     target: str,
-    force: bool,
-    no_strict: bool,
     summarize: bool,
-    version: Optional[str],
-):
+    **kwargs: Unpack[LookupKwargs],
+) -> None:
     """Page through the relations for entities in the given namespace."""
     if relation is None:
-        relations_df = get_relations_df(prefix, force=force, strict=not no_strict, version=version)
+        relations_df = get_relations_df(**kwargs)
         if summarize:
             click.echo(relations_df[relations_df.columns[2]].value_counts())
         else:
             echo_df(relations_df)
     else:
-        curie = normalize_curie(relation)
-        if curie[1] is None:  # that's the identifier
-            click.secho(f"not valid curie, assuming local to {prefix}", fg="yellow")
-            curie = prefix, relation
+        relation_reference = _parse_str_or_curie_or_uri(relation, strict=False)
+        if relation_reference is None:
+            click.secho(f"not a valid curie: {relation}", fg="red")
+            raise sys.exit(1)
         if target is not None:
             norm_target = bioregistry.normalize_prefix(target)
             if norm_target is None:
                 raise ValueError
             relations_df = get_filtered_relations_df(
-                prefix, relation=curie, force=force, strict=not no_strict, target=norm_target
+                relation=relation_reference,
+                target=norm_target,
+                **kwargs,
             )
         else:
             raise NotImplementedError(f"can not filter by target prefix {target}")
-@lookup.command()
-@prefix_argument
+@lookup_annotate
 @click.option("--include-part-of", is_flag=True)
 @click.option("--include-has-member", is_flag=True)
-@verbose_option
-@force_option
-@version_option
 def hierarchy(
-    prefix: str,
     include_part_of: bool,
     include_has_member: bool,
-    force: bool,
-    version: Optional[str],
-):
+    **kwargs: Unpack[LookupKwargs],
+) -> None:
     """Page through the hierarchy for entities in the namespace."""
     h = get_hierarchy(
-        prefix,
         include_part_of=include_part_of,
         include_has_member=include_has_member,
-        force=force,
-        version=version,
+        **kwargs,
     )
-    click.echo_via_pager("\n".join("\t".join(row) for row in h.edges()))
+    if h.number_of_edges() == 0:
+        click.secho("no data", fg="red")
+    else:
+        click.echo_via_pager("\n".join(f"{u.curie}\t{v.curie}" for u, v in h.edges()))
-@lookup.command()
-@prefix_argument
+@lookup_annotate
 @click.argument("identifier")
-@verbose_option
-@force_option
-@version_option
-def ancestors(prefix: str, identifier: str, force: bool, version: Optional[str]):
+def ancestors(
+    identifier: str,
+    **kwargs: Unpack[LookupKwargs],
+) -> None:
     """Look up ancestors."""
-    curies = get_ancestors(prefix=prefix, identifier=identifier, force=force, version=version)
-    for curie in sorted(curies or []):
-        click.echo(f"{curie}\t{get_name_by_curie(curie, version=version)}")
+    # note, prefix is passed via kwargs
+    ancestors = get_ancestors(identifier=identifier, **kwargs)
+    for ancestor in sorted(ancestors or []):
+        click.echo(f"{ancestor.curie}\t{get_name(ancestor, version=kwargs['version'])}")
-@lookup.command()
-@prefix_argument
+@lookup_annotate
 @click.argument("identifier")
-@verbose_option
-@force_option
-@version_option
-def descendants(prefix: str, identifier: str, force: bool, version: Optional[str]):
+def descendants(
+    identifier: str,
+    **kwargs: Unpack[LookupKwargs],
+) -> None:
     """Look up descendants."""
-    curies = get_descendants(prefix=prefix, identifier=identifier, force=force, version=version)
-    for curie in sorted(curies or []):
-        click.echo(f"{curie}\t{get_name_by_curie(curie, version=version)}")
+    # note, prefix is passed via kwargs
+    descendants = get_descendants(identifier=identifier, **kwargs)
+    for descendant in sorted(descendants or []):
+        click.echo(f"{descendant.curie}\t{get_name(descendant, version=kwargs['version'])}")
-@lookup.command()
-@prefix_argument
+@lookup_annotate
 @click.option("-k", "--key")
-@verbose_option
-@force_option
-@version_option
-def properties(prefix: str, key: Optional[str], force: bool, version: Optional[str]):
+def properties(
+    key: str | None,
+    **kwargs: Unpack[LookupKwargs],
+) -> None:
     """Page through the properties for entities in the given namespace."""
     if key is None:
-        properties_df = get_properties_df(prefix, force=force, version=version)
+        properties_df = get_properties_df(**kwargs)
     else:
-        properties_df = get_filtered_properties_df(prefix, prop=key, force=force)
+        properties_df = get_filtered_properties_df(prop=key, **kwargs)
     echo_df(properties_df)
-@lookup.command()
-@prefix_argument
-@verbose_option
-@force_option
-@click.option("-i", "--identifier")
-@version_option
-def alts(prefix: str, identifier: Optional[str], force: bool, version: Optional[str]):
+@lookup_annotate
+@identifier_option
+def alts(
+    identifier: str | None,
+    **kwargs: Unpack[LookupKwargs],
+) -> None:
     """Page through alt ids in a namespace."""
-    id_to_alts = get_id_to_alts(prefix, force=force, version=version)
-    if identifier is None:
-        click.echo_via_pager(
-            "\n".join(
-                f"{identifier}\t{alt}" for identifier, alts in id_to_alts.items() for alt in alts
-            )
-        )
-    else:
-        _alts = id_to_alts.get(identifier)
-        if _alts is None:
-            click.secho(f"No alternate identifiers for {identifier}", fg="red")
-        else:
-            click.echo("\n".join(_alts))
+    id_to_alts = get_id_to_alts(**kwargs)
+    _help_page_mapping(id_to_alts, identifier=identifier)
+@lookup_annotate
+def prefixes(**kwargs: Unpack[LookupKwargs]) -> None:
+    """Page through prefixes appearing in an ontology."""
+    ontology = get_ontology(**kwargs)
+    for prefix in sorted(ontology._get_prefixes(), key=str.casefold):
+        click.echo(prefix)

pyobo/cli/utils.py CHANGED Viewed

@@ -2,6 +2,8 @@
 import datetime
 import pathlib
+from collections.abc import Callable
+from typing import TypeVar
 import click
 import pandas as pd
@@ -9,12 +11,14 @@ import pandas as pd
 from ..constants import DATABASE_DIRECTORY
 __all__ = [
-    "echo_df",
+    "Clickable",
     "directory_option",
-    "zenodo_option",
+    "echo_df",
     "force_option",
+    "force_process_option",
     "prefix_argument",
-    "no_strict_option",
+    "strict_option",
+    "zenodo_option",
 ]
@@ -37,12 +41,21 @@ directory_option = click.option(
     help=f"Build location. Defaults to {DATABASE_DIRECTORY}/<today>",
 )
 zenodo_option = click.option("--zenodo", is_flag=True, help="Automatically upload to zenodo")
-no_strict_option = click.option(
-    "-x", "--no-strict", is_flag=True, help="Turn off failure on bad CURIEs"
+strict_option = click.option(
+    "--strict/--no-strict",
+    default=False,
+    show_default=True,
+    help="Turn on or off failure on unparsable CURIEs",
 )
 prefix_argument = click.argument("prefix")
-force_option = click.option("-f", "--force", is_flag=True)
+force_option = click.option(
+    "-f", "--force", is_flag=True, help="Force re-downloading and re-processing"
+)
 version_option = click.option(
     "--version",
     help="Explicit version of the data. If not given, the most recent will be looked up.",
 )
+force_process_option = click.option(
+    "--force-process", is_flag=True, help="Force re-processing, but not necessarily re-downloading"
+)
+Clickable = TypeVar("Clickable", bound=Callable)

pyobo/constants.py CHANGED Viewed

@@ -1,13 +1,16 @@
 """Constants for PyOBO."""
+from __future__ import annotations
 import logging
 import re
 import pystow
+from typing_extensions import NotRequired, TypedDict
 __all__ = [
-    "RAW_DIRECTORY",
     "DATABASE_DIRECTORY",
+    "RAW_DIRECTORY",
     "SPECIES_REMAPPING",
 ]
@@ -19,6 +22,15 @@ RAW_DIRECTORY = RAW_MODULE.base
 DATABASE_MODULE = PYOBO_MODULE.module("database")
 DATABASE_DIRECTORY = DATABASE_MODULE.base
+#: The directory inside an ontology cache where
+#: large artifacts like OBO, OWL, JSON, etc. go
+BUILD_SUBDIRECTORY_NAME = "build"
+#: The directory inside an ontology cache where
+#: small caches for alts, xrefs, names, etc. go
+CACHE_SUBDIRECTORY_NAME = "cache"
+#: the directory for caching relations
+RELATION_SUBDIRECTORY_NAME = "relations"
 SPECIES_REMAPPING = {
     "Canis familiaris": "Canis lupus familiaris",
 }
@@ -29,7 +41,6 @@ GLOBAL_SKIP = {
     "resid",  # deprecated
     "adw",  # deprecated
 }
-GLOBAL_CHECK_IDS = False
 #: Default prefix
 DEFAULT_PREFIX = "debio"
@@ -79,7 +90,7 @@ TYPEDEFS_FILE = "typedefs.tsv.gz"
 SPECIES_RECORD = "5334738"
 SPECIES_FILE = "species.tsv.gz"
-NCBITAXON_PREFIX = "NCBITaxon"
+NCBITAXON_PREFIX = "ncbitaxon"
 DATE_FORMAT = "%d:%m:%Y %H:%M"
 PROVENANCE_PREFIXES = {
     "pubmed",
@@ -97,3 +108,91 @@ PROVENANCE_PREFIXES = {
     "isbn",
     "issn",
 }
+class DatabaseKwargs(TypedDict):
+    """Keyword arguments for database CLI functions."""
+    strict: bool
+    force: bool
+    force_process: bool
+    skip_pyobo: bool
+    skip_below: str | None
+    skip_set: set[str] | None
+    use_tqdm: bool
+class SlimGetOntologyKwargs(TypedDict):
+    """Keyword arguments for database CLI functions.
+    These arguments are global during iteration over _all_ ontologies, whereas the
+    additional ``version`` is added in the subclass below for specific instances when
+    only a single ontology is requested.
+    """
+    strict: NotRequired[bool]
+    force: NotRequired[bool]
+    force_process: NotRequired[bool]
+class GetOntologyKwargs(SlimGetOntologyKwargs):
+    """Represents the optional keyword arguments passed to :func:`pyobo.get_ontology`.
+    This dictionary doesn't contain ``prefix`` since this is always explicitly handled.
+    """
+    version: NotRequired[str | None]
+    cache: NotRequired[bool]
+    use_tqdm: NotRequired[bool]
+def check_should_force(data: GetOntologyKwargs) -> bool:
+    """Determine whether caching should be forced based on generic keyword arguments."""
+    # note that this could be applied to the superclass of GetOntologyKwargs
+    # but this function should only be used in the scope where GetOntologyKwargs
+    # is appropriate.
+    return data.get("force", False) or data.get("force_process", False)
+def check_should_cache(data: GetOntologyKwargs) -> bool:
+    """Determine whether caching should be done based on generic keyword arguments."""
+    return data.get("cache", True)
+def check_should_use_tqdm(data: GetOntologyKwargs) -> bool:
+    """Determine whether a tqdm progress bar should be used based on generic keyword arguments."""
+    return data.get("use_tqdm", True)
+class LookupKwargs(GetOntologyKwargs):
+    """Represents all arguments passed to :func:`pyobo.get_ontology`.
+    This dictionary does contain the ``prefix`` since it's used in the scope of CLI
+    functions.
+    """
+    prefix: str
+class IterHelperHelperDict(SlimGetOntologyKwargs):
+    """Represents arguments needed when iterating over all ontologies.
+    The explicitly defined arguments in this typed dict are used for the loop function
+    :func:`iter_helper_helper` and the rest that are inherited get passed to
+    :func:`pyobo.get_ontology` in each iteration.
+    """
+    use_tqdm: bool
+    skip_below: str | None
+    skip_pyobo: bool
+    skip_set: set[str] | None
+#: from table 2 of the Functional OWL syntax definition
+#: at https://www.w3.org/TR/owl2-syntax/#IRIs
+DEFAULT_PREFIX_MAP = {
+    "rdfs": "http://www.w3.org/2000/01/rdf-schema#",
+    "rdf": "http://www.w3.org/1999/02/22-rdf-syntax-ns#",
+    "xsd": "http://www.w3.org/2001/XMLSchema#",
+    "owl": "http://www.w3.org/2002/07/owl#",
+}

pyobo 0.11.2__py3-none-any.whl → 0.12.1__py3-none-any.whl

pyobo 0.11.2__py3-none-any.whl → 0.12.1__py3-none-any.whl