PyPI - pyobo - Versions diffs - 0.10.11__py3-none-any.whl → 0.11.0__py3-none-any.whl - Mend

pyobo 0.10.11__py3-none-any.whl → 0.11.0__py3-none-any.whl

This diff shows the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (152) hide show

pyobo/__init__.py +0 -2
pyobo/__main__.py +0 -2
pyobo/api/__init__.py +0 -2
pyobo/api/alts.py +6 -7
pyobo/api/hierarchy.py +14 -15
pyobo/api/metadata.py +3 -4
pyobo/api/names.py +51 -31
pyobo/api/properties.py +6 -7
pyobo/api/relations.py +12 -11
pyobo/api/species.py +5 -6
pyobo/api/typedefs.py +1 -3
pyobo/api/utils.py +63 -2
pyobo/api/xrefs.py +4 -5
pyobo/aws.py +3 -5
pyobo/cli/__init__.py +0 -2
pyobo/cli/aws.py +0 -2
pyobo/cli/cli.py +0 -4
pyobo/cli/database.py +1 -3
pyobo/cli/lookup.py +2 -4
pyobo/cli/utils.py +0 -2
pyobo/constants.py +0 -3
pyobo/getters.py +19 -26
pyobo/gilda_utils.py +28 -8
pyobo/identifier_utils.py +32 -15
pyobo/mocks.py +5 -6
pyobo/normalizer.py +24 -24
pyobo/obographs.py +3 -3
pyobo/plugins.py +3 -4
pyobo/py.typed +0 -0
pyobo/reader.py +19 -21
pyobo/registries/__init__.py +0 -2
pyobo/registries/metaregistry.py +6 -8
pyobo/resource_utils.py +1 -3
pyobo/resources/__init__.py +0 -2
pyobo/resources/ncbitaxon.py +2 -3
pyobo/resources/ro.py +2 -4
pyobo/sources/README.md +15 -0
pyobo/sources/__init__.py +2 -2
pyobo/sources/agrovoc.py +3 -3
pyobo/sources/antibodyregistry.py +4 -5
pyobo/sources/biogrid.py +7 -7
pyobo/sources/ccle.py +3 -4
pyobo/sources/cgnc.py +1 -3
pyobo/sources/chebi.py +2 -4
pyobo/sources/chembl.py +1 -3
pyobo/sources/civic_gene.py +2 -3
pyobo/sources/complexportal.py +3 -5
pyobo/sources/conso.py +2 -4
pyobo/sources/cpt.py +1 -3
pyobo/sources/credit.py +68 -0
pyobo/sources/cvx.py +1 -3
pyobo/sources/depmap.py +3 -4
pyobo/sources/dictybase_gene.py +1 -3
pyobo/sources/drugbank.py +6 -7
pyobo/sources/drugbank_salt.py +3 -4
pyobo/sources/drugcentral.py +5 -7
pyobo/sources/expasy.py +11 -12
pyobo/sources/famplex.py +3 -5
pyobo/sources/flybase.py +2 -4
pyobo/sources/geonames.py +28 -10
pyobo/sources/gmt_utils.py +5 -6
pyobo/sources/go.py +4 -6
pyobo/sources/gwascentral_phenotype.py +1 -3
pyobo/sources/gwascentral_study.py +2 -3
pyobo/sources/hgnc.py +8 -9
pyobo/sources/hgncgenefamily.py +2 -4
pyobo/sources/icd10.py +3 -4
pyobo/sources/icd11.py +3 -4
pyobo/sources/icd_utils.py +6 -7
pyobo/sources/interpro.py +3 -5
pyobo/sources/itis.py +1 -3
pyobo/sources/kegg/__init__.py +0 -2
pyobo/sources/kegg/api.py +3 -4
pyobo/sources/kegg/genes.py +3 -4
pyobo/sources/kegg/genome.py +1 -3
pyobo/sources/kegg/pathway.py +5 -6
pyobo/sources/mesh.py +19 -21
pyobo/sources/mgi.py +1 -3
pyobo/sources/mirbase.py +4 -6
pyobo/sources/mirbase_constants.py +0 -2
pyobo/sources/mirbase_family.py +1 -3
pyobo/sources/mirbase_mature.py +1 -3
pyobo/sources/msigdb.py +4 -5
pyobo/sources/ncbigene.py +3 -5
pyobo/sources/npass.py +2 -4
pyobo/sources/omim_ps.py +1 -3
pyobo/sources/pathbank.py +3 -5
pyobo/sources/pfam.py +1 -3
pyobo/sources/pfam_clan.py +1 -3
pyobo/sources/pid.py +3 -5
pyobo/sources/pombase.py +1 -3
pyobo/sources/pubchem.py +5 -6
pyobo/sources/reactome.py +2 -4
pyobo/sources/rgd.py +3 -4
pyobo/sources/rhea.py +9 -10
pyobo/sources/ror.py +69 -22
pyobo/sources/selventa/__init__.py +0 -2
pyobo/sources/selventa/schem.py +1 -3
pyobo/sources/selventa/scomp.py +1 -3
pyobo/sources/selventa/sdis.py +1 -3
pyobo/sources/selventa/sfam.py +1 -3
pyobo/sources/sgd.py +1 -3
pyobo/sources/slm.py +1 -3
pyobo/sources/umls/__init__.py +0 -2
pyobo/sources/umls/__main__.py +0 -2
pyobo/sources/umls/get_synonym_types.py +1 -1
pyobo/sources/umls/umls.py +2 -4
pyobo/sources/uniprot/__init__.py +0 -2
pyobo/sources/uniprot/uniprot.py +6 -6
pyobo/sources/uniprot/uniprot_ptm.py +6 -5
pyobo/sources/utils.py +3 -5
pyobo/sources/wikipathways.py +1 -3
pyobo/sources/zfin.py +2 -3
pyobo/ssg/__init__.py +3 -2
pyobo/struct/__init__.py +0 -2
pyobo/struct/reference.py +13 -15
pyobo/struct/struct.py +106 -99
pyobo/struct/typedef.py +19 -10
pyobo/struct/utils.py +0 -2
pyobo/utils/__init__.py +0 -2
pyobo/utils/cache.py +14 -6
pyobo/utils/io.py +9 -10
pyobo/utils/iter.py +5 -6
pyobo/utils/misc.py +1 -3
pyobo/utils/ndex_utils.py +6 -7
pyobo/utils/path.py +5 -5
pyobo/version.py +3 -5
pyobo/xrefdb/__init__.py +0 -2
pyobo/xrefdb/canonicalizer.py +27 -18
pyobo/xrefdb/priority.py +0 -2
pyobo/xrefdb/sources/__init__.py +9 -7
pyobo/xrefdb/sources/biomappings.py +0 -2
pyobo/xrefdb/sources/cbms2019.py +0 -2
pyobo/xrefdb/sources/chembl.py +5 -7
pyobo/xrefdb/sources/compath.py +1 -3
pyobo/xrefdb/sources/famplex.py +3 -5
pyobo/xrefdb/sources/gilda.py +0 -2
pyobo/xrefdb/sources/intact.py +5 -5
pyobo/xrefdb/sources/ncit.py +1 -3
pyobo/xrefdb/sources/pubchem.py +2 -4
pyobo/xrefdb/sources/wikidata.py +10 -5
pyobo/xrefdb/xrefs_pipeline.py +15 -16
{pyobo-0.10.11.dist-info → pyobo-0.11.0.dist-info}/LICENSE +1 -1
pyobo-0.11.0.dist-info/METADATA +723 -0
pyobo-0.11.0.dist-info/RECORD +171 -0
{pyobo-0.10.11.dist-info → pyobo-0.11.0.dist-info}/WHEEL +1 -1
pyobo-0.11.0.dist-info/entry_points.txt +2 -0
pyobo/xrefdb/bengo.py +0 -44
pyobo-0.10.11.dist-info/METADATA +0 -499
pyobo-0.10.11.dist-info/RECORD +0 -169
pyobo-0.10.11.dist-info/entry_points.txt +0 -15
{pyobo-0.10.11.dist-info → pyobo-0.11.0.dist-info}/top_level.txt +0 -0

pyobo/plugins.py CHANGED Viewed

@@ -1,9 +1,8 @@
-# -*- coding: utf-8 -*-
 """Tools for loading entry points."""
+from collections.abc import Iterable, Mapping
 from functools import lru_cache
-from typing import Callable, Iterable, Mapping, Optional
+from typing import Callable, Optional
 from .struct import Obo
@@ -14,7 +13,7 @@ __all__ = [
 ]
-@lru_cache()
+@lru_cache
 def _get_nomenclature_plugins() -> Mapping[str, Callable[[], Obo]]:
     from .sources import ontology_resolver

pyobo/py.typed ADDED Viewed

File without changes

pyobo/reader.py CHANGED Viewed

@@ -1,11 +1,10 @@
-# -*- coding: utf-8 -*-
 """OBO Readers."""
 import logging
+from collections.abc import Iterable, Mapping
 from datetime import datetime
 from pathlib import Path
-from typing import Any, Iterable, List, Mapping, Optional, Tuple, Union
+from typing import Any, Optional, Union
 import bioregistry
 import networkx as nx
@@ -13,7 +12,7 @@ from more_itertools import pairwise
 from tqdm.auto import tqdm
 from .constants import DATE_FORMAT, PROVENANCE_PREFIXES
-from .identifier_utils import MissingPrefix, normalize_curie
+from .identifier_utils import MissingPrefixError, normalize_curie
 from .registries import curie_has_blacklisted_prefix, curie_is_blacklisted, remap_prefix
 from .struct import (
     Obo,
@@ -39,7 +38,7 @@ logger = logging.getLogger(__name__)
 # FIXME use bioontologies
 # RELATION_REMAPPINGS: Mapping[str, Tuple[str, str]] = bioontologies.upgrade.load()
-RELATION_REMAPPINGS: Mapping[str, Tuple[str, str]] = {
+RELATION_REMAPPINGS: Mapping[str, tuple[str, str]] = {
     "part_of": part_of.pair,
     "has_part": has_part.pair,
     "develops_from": develops_from.pair,
@@ -75,7 +74,7 @@ def from_obo_path(
     return from_obonet(graph, strict=strict, **kwargs)
-def from_obonet(graph: nx.MultiDiGraph, *, strict: bool = True) -> "Obo":  # noqa:C901
+def from_obonet(graph: nx.MultiDiGraph, *, strict: bool = True) -> "Obo":
     """Get all of the terms from a OBO graph."""
     _ontology = graph.graph["ontology"]
     ontology = bioregistry.normalize_prefix(_ontology)  # probably always okay
@@ -126,12 +125,12 @@ def from_obonet(graph: nx.MultiDiGraph, *, strict: bool = True) -> "Obo":  # noq
         )
         for prefix, identifier, data in _iter_obo_graph(graph=graph, strict=strict)
     )
-    references: Mapping[Tuple[str, str], Reference] = {
+    references: Mapping[tuple[str, str], Reference] = {
         reference.pair: reference for reference in reference_it
     }
     #: CURIEs to typedefs
-    typedefs: Mapping[Tuple[str, str], TypeDef] = {
+    typedefs: Mapping[tuple[str, str], TypeDef] = {
         typedef.pair: typedef for typedef in iterate_graph_typedefs(graph, ontology)
     }
@@ -152,7 +151,7 @@ def from_obonet(graph: nx.MultiDiGraph, *, strict: bool = True) -> "Obo":  # noq
         try:
             node_xrefs = list(iterate_node_xrefs(prefix=prefix, data=data, strict=strict))
-        except MissingPrefix as e:
+        except MissingPrefixError as e:
             e.reference = reference
             raise e
         xrefs, provenance = [], []
@@ -171,7 +170,7 @@ def from_obonet(graph: nx.MultiDiGraph, *, strict: bool = True) -> "Obo":  # noq
         try:
             alt_ids = list(iterate_node_alt_ids(data, strict=strict))
-        except MissingPrefix as e:
+        except MissingPrefixError as e:
             e.reference = reference
             raise e
         n_alt_ids += len(alt_ids)
@@ -185,7 +184,7 @@ def from_obonet(graph: nx.MultiDiGraph, *, strict: bool = True) -> "Obo":  # noq
                     strict=strict,
                 )
             )
-        except MissingPrefix as e:
+        except MissingPrefixError as e:
             e.reference = reference
             raise e
         n_parents += len(parents)
@@ -220,7 +219,7 @@ def from_obonet(graph: nx.MultiDiGraph, *, strict: bool = True) -> "Obo":  # noq
                     strict=strict,
                 )
             )
-        except MissingPrefix as e:
+        except MissingPrefixError as e:
             e.reference = reference
             raise e
         for relation, reference in relations_references:
@@ -278,7 +277,7 @@ def _iter_obo_graph(
     graph: nx.MultiDiGraph,
     *,
     strict: bool = True,
-) -> Iterable[Tuple[str, str, Mapping[str, Any]]]:
+) -> Iterable[tuple[str, str, Mapping[str, Any]]]:
     """Iterate over the nodes in the graph with the prefix stripped (if it's there)."""
     for node, data in graph.nodes(data=True):
         prefix, identifier = normalize_curie(node, strict=strict)
@@ -366,7 +365,8 @@ def iterate_graph_typedefs(
 def get_definition(
     data, *, prefix: str, identifier: str
-) -> Union[Tuple[None, None], Tuple[str, List[Reference]]]:
+) -> Union[tuple[None, None], tuple[str, list[Reference]]]:
+    """Extract the definition from the data."""
     definition = data.get("def")  # it's allowed not to have a definition
     if not definition:
         return None, None
@@ -379,7 +379,7 @@ def _extract_definition(
     prefix: str,
     identifier: str,
     strict: bool = False,
-) -> Union[Tuple[None, None], Tuple[str, List[Reference]]]:
+) -> Union[tuple[None, None], tuple[str, list[Reference]]]:
     """Extract the definitions."""
     if not s.startswith('"'):
         raise ValueError("definition does not start with a quote")
@@ -405,7 +405,7 @@ def _get_first_nonquoted(s: str) -> Optional[int]:
     return None
-def _quote_split(s: str) -> Tuple[str, str]:
+def _quote_split(s: str) -> tuple[str, str]:
     s = s.lstrip('"')
     i = _get_first_nonquoted(s)
     if i is None:
@@ -416,9 +416,7 @@ def _quote_split(s: str) -> Tuple[str, str]:
 def _clean_definition(s: str) -> str:
     # if '\t' in s:
     #     logger.warning('has tab')
-    return (
-        s.replace('\\"', '"').replace("\n", " ").replace("\t", " ").replace("\d", "")  # noqa:W605
-    )
+    return s.replace('\\"', '"').replace("\n", " ").replace("\t", " ").replace(r"\d", "")
 def _extract_synonym(
@@ -516,7 +514,7 @@ HANDLED_PROPERTY_TYPES = {
 def iterate_node_properties(
     data: Mapping[str, Any], *, property_prefix: Optional[str] = None, term=None
-) -> Iterable[Tuple[str, str]]:
+) -> Iterable[tuple[str, str]]:
     """Extract properties from a :mod:`obonet` node's data."""
     for prop_value_type in data.get("property_value", []):
         try:
@@ -568,7 +566,7 @@ def iterate_node_relationships(
     prefix: str,
     identifier: str,
     strict: bool = True,
-) -> Iterable[Tuple[Reference, Reference]]:
+) -> Iterable[tuple[Reference, Reference]]:
     """Extract relationships from a :mod:`obonet` node's data."""
     for s in data.get("relationship", []):
         relation_curie, target_curie = s.split(" ")

pyobo/registries/__init__.py CHANGED Viewed

@@ -1,5 +1,3 @@
-# -*- coding: utf-8 -*-
 """Extract registry information."""
 from .metaregistry import (  # noqa: F401

pyobo/registries/metaregistry.py CHANGED Viewed

@@ -1,13 +1,11 @@
-# -*- coding: utf-8 -*-
 """Load the manually curated metaregistry."""
 import itertools as itt
 import json
 import os
+from collections.abc import Iterable, Mapping
 from functools import lru_cache
 from pathlib import Path
-from typing import Iterable, Mapping, Set, Tuple
 import bioregistry
@@ -25,7 +23,7 @@ def has_no_download(prefix: str) -> bool:
 @lru_cache(maxsize=1)
-def _no_download() -> Set[str]:
+def _no_download() -> set[str]:
     """Get the list of prefixes not available as OBO."""
     return {
         prefix
@@ -41,7 +39,7 @@ def curie_has_blacklisted_prefix(curie: str) -> bool:
 @lru_cache(maxsize=1)
-def get_xrefs_prefix_blacklist() -> Set[str]:
+def get_xrefs_prefix_blacklist() -> set[str]:
     """Get the set of blacklisted xref prefixes."""
     #: Xrefs starting with these prefixes will be ignored
     prefixes = set(
@@ -65,7 +63,7 @@ def curie_has_blacklisted_suffix(curie: str) -> bool:
 @lru_cache(maxsize=1)
-def get_xrefs_suffix_blacklist() -> Set[str]:
+def get_xrefs_suffix_blacklist() -> set[str]:
     """Get the set of blacklisted xref suffixes."""
     #: Xrefs ending with these suffixes will be ignored
     return set(CURATED_REGISTRY["blacklists"]["suffix"])
@@ -77,7 +75,7 @@ def curie_is_blacklisted(curie: str) -> bool:
 @lru_cache(maxsize=1)
-def get_xrefs_blacklist() -> Set[str]:
+def get_xrefs_blacklist() -> set[str]:
     """Get the set of blacklisted xrefs."""
     rv = set()
     for x in CURATED_REGISTRY["blacklists"]["full"]:
@@ -123,7 +121,7 @@ def remap_prefix(curie: str) -> str:
     return curie
-def iter_cached_obo() -> Iterable[Tuple[str, str]]:
+def iter_cached_obo() -> Iterable[tuple[str, str]]:
     """Iterate over cached OBO paths."""
     for prefix in os.listdir(RAW_DIRECTORY):
         if prefix in GLOBAL_SKIP or has_no_download(prefix) or bioregistry.is_deprecated(prefix):

pyobo/resource_utils.py CHANGED Viewed

@@ -1,9 +1,7 @@
-# -*- coding: utf-8 -*-
 """Resource utilities for PyOBO."""
+from collections.abc import Sequence
 from functools import lru_cache
-from typing import Sequence
 import click
 import pandas as pd

pyobo/resources/__init__.py CHANGED Viewed

@@ -1,3 +1 @@
-# -*- coding: utf-8 -*-
 """Pre-cached resources for PyOBO."""

pyobo/resources/ncbitaxon.py CHANGED Viewed

@@ -1,12 +1,11 @@
-# -*- coding: utf-8 -*-
 """Loading of the NCBI Taxonomy names."""
 import csv
 import gzip
+from collections.abc import Mapping
 from functools import lru_cache
 from pathlib import Path
-from typing import Mapping, Optional, Union
+from typing import Optional, Union
 import requests

pyobo/resources/ro.py CHANGED Viewed

@@ -1,11 +1,9 @@
-# -*- coding: utf-8 -*-
 """Loading of the relations ontology names."""
 import csv
 import os
+from collections.abc import Mapping
 from functools import lru_cache
-from typing import Mapping, Tuple
 import requests
@@ -20,7 +18,7 @@ PREFIX = "http://purl.obolibrary.org/obo/"
 @lru_cache(maxsize=1)
-def load_ro() -> Mapping[Tuple[str, str], str]:
+def load_ro() -> Mapping[tuple[str, str], str]:
     """Load the relation ontology names."""
     if not os.path.exists(PATH):
         download()

pyobo/sources/README.md ADDED Viewed

@@ -0,0 +1,15 @@
+# Sources
+1. Create a new module in `pyobo.sources` named with the prefix for the resource you're ontologizing
+2. Make sure your resource has a corresponding prefix in [the Bioregistry](https://github.com/biopragmatics/bioregistry)
+3. Subclass the `pyobo.Obo` class to represent your resource
+4. Add your resource to the list in `pyobo.sources.__init__`
+## What is in scope?
+1. Biomedical, semantic web, bibliographic, life sciences, and related natural sciences resources are welcome
+2. The source you want to ontologize should be an identifier resource, i.e., it mints its own identifiers. If you want
+   to ontologize some database that reuses some other identifier resource's identifiers, then this isn't the right
+   place.
+3. Resources that are not possible to download automatically are not in scope for PyOBO. Reproducibility and reusability
+   are core values of this software

pyobo/sources/__init__.py CHANGED Viewed

@@ -1,5 +1,3 @@
-# -*- coding: utf-8 -*-
 """Sources of OBO content."""
 from class_resolver import ClassResolver
@@ -12,6 +10,7 @@ from .civic_gene import CIVICGeneGetter
 from .complexportal import ComplexPortalGetter
 from .conso import CONSOGetter
 from .cpt import CPTGetter
+from .credit import CreditGetter
 from .cvx import CVXGetter
 from .depmap import DepMapGetter
 from .dictybase_gene import DictybaseGetter
@@ -69,6 +68,7 @@ __all__ = [
     "CVXGetter",
     "ChEMBLCompoundGetter",
     "ComplexPortalGetter",
+    "CreditGetter",
     "DepMapGetter",
     "DictybaseGetter",
     "DrugBankGetter",

pyobo/sources/agrovoc.py CHANGED Viewed

@@ -1,5 +1,3 @@
-# -*- coding: utf-8 -*-
 """Converter for AGROVOC."""
 import pystow
@@ -11,6 +9,8 @@ __all__ = [
     "ensure_agrovoc_graph",
 ]
+PREFIX = "agrovoc"
 def ensure_agrovoc_graph(version: str) -> Graph:
     """Download and parse the given version of AGROVOC."""
@@ -20,5 +20,5 @@ def ensure_agrovoc_graph(version: str) -> Graph:
     graph.bind("skosxl", "http://www.w3.org/2008/05/skos-xl#")
     graph.bind("skos", SKOS)
     graph.bind("dcterms", DCTERMS)
-    graph.bind("agrovoc", "http://aims.fao.org/aos/agrontology#")
+    graph.bind(PREFIX, "http://aims.fao.org/aos/agrontology#")
     return graph

pyobo/sources/antibodyregistry.py CHANGED Viewed

@@ -1,16 +1,15 @@
-# -*- coding: utf-8 -*-
 """Converter for the Antibody Registry."""
 import logging
-from typing import Iterable, Mapping, Optional
+from collections.abc import Iterable, Mapping
+from typing import Optional
-import bioversions
 import pandas as pd
 from bioregistry.utils import removeprefix
 from tqdm.auto import tqdm
 from pyobo import Obo, Term
+from pyobo.api.utils import get_version
 from pyobo.utils.path import ensure_df
 __all__ = [
@@ -27,7 +26,7 @@ CHUNKSIZE = 20_000
 def get_chunks(*, force: bool = False, version: Optional[str] = None) -> pd.DataFrame:
     """Get the BioGRID identifiers mapping dataframe."""
     if version is None:
-        version = bioversions.get_version(PREFIX)
+        version = get_version(PREFIX)
     df = ensure_df(
         PREFIX,
         url=URL,

pyobo/sources/biogrid.py CHANGED Viewed

@@ -1,13 +1,12 @@
-# -*- coding: utf-8 -*-
 """Extract and convert BioGRID identifiers."""
+from collections.abc import Mapping
 from functools import partial
-from typing import Mapping, Optional
+from typing import Optional
-import bioversions
 import pandas as pd
+from pyobo.api.utils import get_version
 from pyobo.resources.ncbitaxon import get_ncbitaxon_id
 from pyobo.utils.cache import cached_mapping
 from pyobo.utils.path import ensure_df, prefix_directory_join
@@ -52,7 +51,7 @@ def _lookup(name: str) -> Optional[str]:
 def get_df() -> pd.DataFrame:
     """Get the BioGRID identifiers mapping dataframe."""
-    version = bioversions.get_version("biogrid")
+    version = get_version("biogrid")
     url = f"{BASE_URL}/BIOGRID-{version}/BIOGRID-IDENTIFIERS-{version}.tab.zip"
     df = ensure_df(PREFIX, url=url, skiprows=28, dtype=str, version=version)
     df["taxonomy_id"] = df["ORGANISM_OFFICIAL_NAME"].map(_lookup)
@@ -65,7 +64,7 @@ def get_df() -> pd.DataFrame:
         "cache",
         "xrefs",
         name="ncbigene.tsv",
-        version=partial(bioversions.get_version, PREFIX),
+        version=partial(get_version, PREFIX),
     ),
     header=["biogrid_id", "ncbigene_id"],
 )
@@ -77,7 +76,8 @@ def get_ncbigene_mapping() -> Mapping[str, str]:
     .. code-block:: python
         from pyobo import get_filtered_xrefs
-        biogrid_ncbigene_mapping = get_filtered_xrefs('biogrid', 'ncbigene')
+        biogrid_ncbigene_mapping = get_filtered_xrefs("biogrid", "ncbigene")
     """
     df = get_df()
     df = df.loc[df["IDENTIFIER_TYPE"] == "ENTREZ_GENE", ["BIOGRID_ID", "IDENTIFIER_VALUE"]]

pyobo/sources/ccle.py CHANGED Viewed

@@ -1,10 +1,9 @@
-# -*- coding: utf-8 -*-
 """Get the CCLE Cells, provided by cBioPortal."""
 import tarfile
+from collections.abc import Iterable
 from pathlib import Path
-from typing import Iterable, Optional
+from typing import Optional
 import pandas as pd
 import pystow
@@ -25,7 +24,7 @@ class CCLEGetter(Obo):
     ontology = bioregistry_key = PREFIX
-    def __post_init__(self):  # noqa: D105
+    def __post_init__(self):
         self.data_version = VERSION
     def iter_terms(self, force: bool = False) -> Iterable[Term]:

pyobo/sources/cgnc.py CHANGED Viewed

@@ -1,9 +1,7 @@
-# -*- coding: utf-8 -*-
 """Converter for CGNC."""
 import logging
-from typing import Iterable
+from collections.abc import Iterable
 import pandas as pd

pyobo/sources/chebi.py CHANGED Viewed

@@ -1,8 +1,6 @@
-# -*- coding: utf-8 -*-
 """Converter for ChEBI."""
-from typing import Mapping, Set, Tuple
+from collections.abc import Mapping
 from ..api import get_filtered_properties_mapping, get_filtered_relations_df
 from ..struct import Reference, TypeDef
@@ -33,7 +31,7 @@ def get_chebi_smiles_id_mapping() -> Mapping[str, str]:
 has_role = TypeDef(reference=Reference(prefix="chebi", identifier="has_role"))
-def get_chebi_role_to_children() -> Mapping[str, Set[Tuple[str, str]]]:
+def get_chebi_role_to_children() -> Mapping[str, set[tuple[str, str]]]:
     """Get the ChEBI role to children mapping."""
     df = get_filtered_relations_df("chebi", relation=has_role)
     return multisetdict((role_id, ("chebi", chemical_id)) for chemical_id, _, role_id in df.values)

pyobo/sources/chembl.py CHANGED Viewed

@@ -1,13 +1,11 @@
-# -*- coding: utf-8 -*-
 """Converter for ChEMBL.
 Run with ``python -m pyobo.sources.chembl -vv``.
 """
 import logging
+from collections.abc import Iterable
 from contextlib import closing
-from typing import Iterable
 import chembl_downloader

pyobo/sources/civic_gene.py CHANGED Viewed

@@ -1,8 +1,7 @@
-# -*- coding: utf-8 -*-
 """Converter for CiVIC Genes."""
-from typing import Iterable, Optional
+from collections.abc import Iterable
+from typing import Optional
 import pandas as pd

pyobo/sources/complexportal.py CHANGED Viewed

@@ -1,9 +1,7 @@
-# -*- coding: utf-8 -*-
 """Converter for ComplexPortal."""
 import logging
-from typing import Iterable, List, Tuple
+from collections.abc import Iterable
 import pandas as pd
 from tqdm.auto import tqdm
@@ -52,7 +50,7 @@ DTYPE = {
 }
-def _parse_members(s) -> List[Tuple[Reference, str]]:
+def _parse_members(s) -> list[tuple[Reference, str]]:
     if pd.isna(s):
         return []
@@ -68,7 +66,7 @@ def _parse_members(s) -> List[Tuple[Reference, str]]:
     return rv
-def _parse_xrefs(s) -> List[Tuple[Reference, str]]:
+def _parse_xrefs(s) -> list[tuple[Reference, str]]:
     if pd.isna(s):
         return []

pyobo/sources/conso.py CHANGED Viewed

@@ -1,8 +1,6 @@
-# -*- coding: utf-8 -*-
 """Converter for CONSO."""
-from typing import Iterable, List
+from collections.abc import Iterable
 import pandas as pd
@@ -68,7 +66,7 @@ def iter_terms() -> Iterable[Term]:
     for _, row in terms_df.iterrows():
         if row["Name"] == "WITHDRAWN":
             continue
-        provenance: List[Reference] = []
+        provenance: list[Reference] = []
         for curie in row["References"].split(","):
             curie = curie.strip()
             if not curie:

pyobo/sources/cpt.py CHANGED Viewed

@@ -1,8 +1,6 @@
-# -*- coding: utf-8 -*-
 """Converter for CPT."""
-from typing import Iterable
+from collections.abc import Iterable
 import pandas as pd

pyobo/sources/credit.py ADDED Viewed

@@ -0,0 +1,68 @@
+"""Converter for the Contributor Roles Taxonomy."""
+from __future__ import annotations
+import json
+from collections.abc import Iterable
+from more_itertools import chunked
+from pyobo.struct import Obo, Term
+from pyobo.utils.path import ensure_path
+__all__ = [
+    "CreditGetter",
+]
+url = "https://api.github.com/repos/CASRAI-CRedIT/Dictionary/contents/Picklists/Contributor%20Roles"
+PREFIX = "credit"
+class CreditGetter(Obo):
+    """An ontology representation of the Contributor Roles Taxonomy."""
+    ontology = PREFIX
+    static_version = "2022"
+    idspaces = {
+        PREFIX: "https://credit.niso.org/contributor-roles/",
+    }
+    def iter_terms(self, force: bool = False) -> Iterable[Term]:
+        """Iterate over terms in the ontology."""
+        return get_terms(force=force)
+def get_obo(force: bool = False) -> Obo:
+    """Get RGD as OBO."""
+    return CreditGetter(force=force)
+def get_terms(force: bool = False) -> list[Term]:
+    """Get terms from the Contributor Roles Taxonomy via GitHub."""
+    path = ensure_path(PREFIX, url=url, name="picklist-api.json", force=force)
+    with open(path) as f:
+        data = json.load(f)
+    terms = []
+    for x in data:
+        name = x["name"].removesuffix(".md").lower()
+        pp = ensure_path(PREFIX, "picklist", url=x["download_url"], backend="requests")
+        with open(pp) as f:
+            header, *rest = f.read().splitlines()
+            name = header = header.removeprefix("# Contributor Roles/")
+            dd = {k.removeprefix("## "): v for k, v in chunked(rest, 2)}
+            identifier = (
+                dd["Canonical URL"]
+                .removeprefix("https://credit.niso.org/contributor-roles/")
+                .rstrip("/")
+            )
+            desc = dd["Short definition"]
+            terms.append(
+                Term.from_triple(prefix=PREFIX, identifier=identifier, name=name, definition=desc)
+            )
+    return terms
+if __name__ == "__main__":
+    get_obo(force=True).write_default(write_obo=True)

pyobo/sources/cvx.py CHANGED Viewed

@@ -1,9 +1,7 @@
-# -*- coding: utf-8 -*-
 """Converter for CVX."""
 from collections import defaultdict
-from typing import Iterable
+from collections.abc import Iterable
 import pandas as pd

pyobo/sources/depmap.py CHANGED Viewed

@@ -1,8 +1,7 @@
-# -*- coding: utf-8 -*-
 """DepMap cell lines."""
-from typing import Iterable, Optional
+from collections.abc import Iterable
+from typing import Optional
 import pandas as pd
 import pystow
@@ -113,7 +112,7 @@ def ensure(version: str, force: bool = False) -> pd.DataFrame:
         url=get_url(version=version),
         name="sample_info.tsv",
         force=force,
-        read_csv_kwargs=dict(sep=",", dtype=str),
+        read_csv_kwargs={"sep": ",", "dtype": str},
     )

pyobo 0.10.11__py3-none-any.whl → 0.11.0__py3-none-any.whl

pyobo 0.10.11__py3-none-any.whl → 0.11.0__py3-none-any.whl