protein-quest 0.3.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

@@ -0,0 +1,511 @@
+ """Module for searching UniProtKB using SPARQL."""
+
+ import logging
+ from collections.abc import Collection, Iterable
+ from dataclasses import dataclass
+ from itertools import batched
+ from textwrap import dedent
+
+ from SPARQLWrapper import JSON, SPARQLWrapper
+ from tqdm.auto import tqdm
+
+ logger = logging.getLogger(__name__)
+
+
+ @dataclass
+ class Query:
+     """Search query for UniProtKB.
+
+     Parameters:
+         taxon_id: NCBI Taxon ID to filter results by organism (e.g., "9606" for human).
+         reviewed: Whether to filter results by reviewed status (True for reviewed, False for unreviewed).
+         subcellular_location_uniprot: Subcellular location in UniProt format (e.g., "nucleus").
+         subcellular_location_go: Subcellular location in GO format. Can be a single GO term
+             (e.g., ["GO:0005634"]) or a collection of GO terms (e.g., ["GO:0005634", "GO:0005737"]).
+         molecular_function_go: Molecular function in GO format. Can be a single GO term
+             (e.g., ["GO:0003674"]) or a collection of GO terms (e.g., ["GO:0003674", "GO:0008150"]).
+     """
+
+     # TODO make taxon_id an int
+     taxon_id: str | None
+     reviewed: bool | None = None
+     subcellular_location_uniprot: str | None = None
+     subcellular_location_go: list[str] | None = None
+     molecular_function_go: list[str] | None = None
+
+
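Since Query is a plain dataclass, constructing one is just keyword arguments. A minimal sketch; the taxon and GO values below are illustrative, not package defaults:

# Hypothetical query: reviewed human proteins annotated as located in the nucleus.
# "9606" (human) and "GO:0005634" (nucleus) are example values.
query = Query(
    taxon_id="9606",
    reviewed=True,
    subcellular_location_go=["GO:0005634"],
)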
+ def _first_chain_from_uniprot_chains(uniprot_chains: str) -> str:
+     """Extracts the first chain identifier from a UniProt chains string.
+
+     The UniProt chains string is formatted (in EBNF notation) as follows:
+
+         chain_group(=range)?(,chain_group(=range)?)*
+
+     where:
+
+         chain_group := chain_id(/chain_id)*
+         chain_id := [A-Za-z]+
+         range := start-end
+         start, end := integer
+
+     Args:
+         uniprot_chains: A string representing UniProt chains, for example "B/D=1-81".
+
+     Returns:
+         The first chain identifier from the UniProt chains string. For example "B".
+     """
+     chains = uniprot_chains.split("=")
+     parts = chains[0].split("/")
+     chain = parts[0]
+     try:
+         # Workaround for Q9Y2Q5 │ 5YK3 │ 1/B/G=1-124: chain 1 does not exist but B does
+         int(chain)
+         if len(parts) > 1:
+             return parts[1]
+     except ValueError:
+         # A letter, so a regular chain identifier
+         pass
+     return chain
+
+
+ @dataclass(frozen=True)
+ class PdbResult:
+     """Result of a PDB search in UniProtKB.
+
+     Parameters:
+         id: PDB ID (e.g., "1H3O").
+         method: Method used for the PDB entry (e.g., "X-ray diffraction").
+         uniprot_chains: Chains in UniProt format (e.g., "A/B=1-42,A/B=50-99").
+         resolution: Resolution of the PDB entry (e.g., "2.0" for 2.0 Å). Optional.
+     """
+
+     id: str
+     method: str
+     uniprot_chains: str
+     resolution: str | None = None
+
+     @property
+     def chain(self) -> str:
+         """The first chain identifier parsed from self.uniprot_chains."""
+         return _first_chain_from_uniprot_chains(self.uniprot_chains)
+
+
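For illustration, a PdbResult can be constructed directly and its derived chain read back. The values here just mirror the docstring examples:

entry = PdbResult(id="1H3O", method="X-ray diffraction", uniprot_chains="A/B=1-42,A/B=50-99", resolution="2.0")
print(entry.chain)  # -> "A", the first identifier of the first chain group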
+ def _query2dynamic_sparql_triples(query: Query) -> str:
+     parts: list[str] = []
+     if query.taxon_id:
+         parts.append(f"?protein up:organism taxon:{query.taxon_id} .")
+
+     if query.reviewed:
+         parts.append("?protein up:reviewed true .")
+     elif query.reviewed is False:
+         parts.append("?protein up:reviewed false .")
+
+     parts.append(_append_subcellular_location_filters(query))
+
+     if query.molecular_function_go:
+         # Handle both single GO term (string) and multiple GO terms (list)
+         if isinstance(query.molecular_function_go, str):
+             go_terms = [query.molecular_function_go]
+         else:
+             go_terms = query.molecular_function_go
+
+         molecular_function_filter = _create_go_filter(go_terms, "Molecular function")
+         parts.append(molecular_function_filter)
+
+     return "\n".join(parts)
+
+
+ def _create_go_filter(go_terms: Collection[str], term_type: str) -> str:
+     """Create SPARQL filter for GO terms.
+
+     Args:
+         go_terms: Collection of GO terms to filter by.
+         term_type: Type of GO terms for error messages (e.g., "Molecular function", "Subcellular location").
+
+     Returns:
+         SPARQL filter string.
+     """
+     # Validate all GO terms start with "GO:"
+     for term in go_terms:
+         if not term.startswith("GO:"):
+             msg = f"{term_type} GO term must start with 'GO:', got: {term}"
+             raise ValueError(msg)
+
+     if len(go_terms) == 1:
+         # Single GO term - get the first (and only) term
+         term = next(iter(go_terms))
+         return dedent(f"""
+             ?protein up:classifiedWith|(up:classifiedWith/rdfs:subClassOf+) {term} .
+         """)
+
+     # Multiple GO terms - use UNION for OR logic
+     union_parts = [
+         dedent(f"""
+             {{ ?protein up:classifiedWith|(up:classifiedWith/rdfs:subClassOf+) {term} . }}
+         """).strip()
+         for term in go_terms
+     ]
+     return " UNION ".join(union_parts)
+
+
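To make the OR logic concrete: for two terms the function emits one bracketed pattern per term, joined by UNION on a single line (shown wrapped here for readability):

print(_create_go_filter(["GO:0005634", "GO:0005737"], "Subcellular location"))
# { ?protein up:classifiedWith|(up:classifiedWith/rdfs:subClassOf+) GO:0005634 . }
#   UNION
# { ?protein up:classifiedWith|(up:classifiedWith/rdfs:subClassOf+) GO:0005737 . }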
+ def _append_subcellular_location_filters(query: Query) -> str:
+     subcellular_location_uniprot_part = ""
+     subcellular_location_go_part = ""
+
+     if query.subcellular_location_uniprot:
+         subcellular_location_uniprot_part = dedent(f"""
+             ?protein up:annotation ?subcellAnnotation .
+             ?subcellAnnotation up:locatedIn/up:cellularComponent ?cellcmpt .
+             ?cellcmpt skos:prefLabel "{query.subcellular_location_uniprot}" .
+         """)
+
+     if query.subcellular_location_go:
+         # Handle both single GO term (string) and multiple GO terms (list)
+         if isinstance(query.subcellular_location_go, str):
+             go_terms = [query.subcellular_location_go]
+         else:
+             go_terms = query.subcellular_location_go
+
+         subcellular_location_go_part = _create_go_filter(go_terms, "Subcellular location")
+
+     if subcellular_location_uniprot_part and subcellular_location_go_part:
+         # If both are provided, include results for either with a logical OR
+         return dedent(f"""
+             {{
+                 {subcellular_location_uniprot_part}
+             }} UNION {{
+                 {subcellular_location_go_part}
+             }}
+         """)
+
+     return subcellular_location_uniprot_part or subcellular_location_go_part
+
+
+ def _build_sparql_generic_query(select_clause: str, where_clause: str, limit: int = 10_000, groupby_clause: str = "") -> str:
+     """
+     Builds a generic SPARQL query with the given select and where clauses.
+     """
+     groupby = f" GROUP BY {groupby_clause}" if groupby_clause else ""
+     return dedent(f"""
+         PREFIX up: <http://purl.uniprot.org/core/>
+         PREFIX taxon: <http://purl.uniprot.org/taxonomy/>
+         PREFIX rdf: <http://www.w3.org/1999/02/22-rdf-syntax-ns#>
+         PREFIX rdfs: <http://www.w3.org/2000/01/rdf-schema#>
+         PREFIX skos: <http://www.w3.org/2004/02/skos/core#>
+         PREFIX GO: <http://purl.obolibrary.org/obo/GO_>
+
+         SELECT {select_clause}
+         WHERE {{
+             {where_clause}
+         }}
+         {groupby}
+         LIMIT {limit}
+     """)
+
+
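Every query in this module goes through this template; a minimal call makes the shape obvious (whitespace aside):

print(_build_sparql_generic_query("DISTINCT ?protein", "?protein a up:Protein .", limit=5))
# Prints the PREFIX block followed by:
#   SELECT DISTINCT ?protein
#   WHERE { ?protein a up:Protein . }
#   LIMIT 5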
+ def _build_sparql_generic_by_uniprot_accessions_query(
+     uniprot_accs: Iterable[str], select_clause: str, where_clause: str, limit: int = 10_000, groupby_clause: str = ""
+ ) -> str:
+     values = " ".join(f'("{ac}")' for ac in uniprot_accs)
+     where_clause2 = dedent(f"""
+         # --- Protein Selection ---
+         VALUES (?ac) {{ {values} }}
+         BIND (IRI(CONCAT("http://purl.uniprot.org/uniprot/", ?ac)) AS ?protein)
+         ?protein a up:Protein .
+
+         {where_clause}
+     """)
+     return _build_sparql_generic_query(
+         select_clause=select_clause,
+         where_clause=where_clause2,
+         limit=limit,
+         groupby_clause=groupby_clause,
+     )
+
+
+ def _build_sparql_query_uniprot(query: Query, limit: int = 10_000) -> str:
+     dynamic_triples = _query2dynamic_sparql_triples(query)
+     # TODO add useful columns that have a 1:1 mapping to protein,
+     # like uniprot_id with `?protein up:mnemonic ?mnemonic .`
+     # and sequence; take care to take the first isoform:
+     # ?protein up:sequence ?isoform .
+     # ?isoform rdf:value ?sequence .
+     select_clause = "DISTINCT ?protein"
+     where_clause = dedent(f"""
+         # --- Protein Selection ---
+         ?protein a up:Protein .
+         {dynamic_triples}
+     """)
+     return _build_sparql_generic_query(select_clause, dedent(where_clause), limit)
+
+
+ def _build_sparql_query_pdb(uniprot_accs: Iterable[str], limit: int = 10_000) -> str:
+     # For http://purl.uniprot.org/uniprot/O00268 + http://rdf.wwpdb.org/pdb/1H3O
+     # the chainSequenceMapping values are
+     # http://purl.uniprot.org/isoforms/O00268-1#PDB_1H3O_tt872tt945
+     # http://purl.uniprot.org/isoforms/Q16514-1#PDB_1H3O_tt57tt128
+     # For http://purl.uniprot.org/uniprot/O00255 + http://rdf.wwpdb.org/pdb/3U84
+     # the chainSequenceMapping values are
+     # http://purl.uniprot.org/isoforms/O00255-2#PDB_3U84_tt520tt610
+     # http://purl.uniprot.org/isoforms/O00255-2#PDB_3U84_tt2tt459
+     # To get the chain belonging to the uniprot/pdb pair we need to
+     # do some string filtering.
+     # Also there can be multiple chains for the same uniprot/pdb pair, so we need to
+     # do a group by and concat.
+
+     select_clause = dedent("""\
+         ?protein ?pdb_db ?pdb_method ?pdb_resolution
+         (GROUP_CONCAT(DISTINCT ?pdb_chain; separator=",") AS ?pdb_chains)
+     """)
+
+     where_clause = dedent("""
+         # --- PDB Info ---
+         ?protein rdfs:seeAlso ?pdb_db .
+         ?pdb_db up:database <http://purl.uniprot.org/database/PDB> .
+         ?pdb_db up:method ?pdb_method .
+         ?pdb_db up:chainSequenceMapping ?chainSequenceMapping .
+         BIND(STRAFTER(STR(?chainSequenceMapping), "isoforms/") AS ?isoformPart)
+         FILTER(STRSTARTS(?isoformPart, CONCAT(?ac, "-")))
+         ?chainSequenceMapping up:chain ?pdb_chain .
+         OPTIONAL { ?pdb_db up:resolution ?pdb_resolution . }
+     """)
+
+     groupby_clause = "?protein ?pdb_db ?pdb_method ?pdb_resolution"
+     return _build_sparql_generic_by_uniprot_accessions_query(
+         uniprot_accs, select_clause, where_clause, limit, groupby_clause
+     )
+
+
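The string filtering in that WHERE clause is doing real work. Restated in plain Python, using the O00268/1H3O example from the comments above:

# Mimics BIND(STRAFTER(...)) + FILTER(STRSTARTS(...)) for ?ac = "O00268".
mapping = "http://purl.uniprot.org/isoforms/Q16514-1#PDB_1H3O_tt57tt128"
isoform_part = mapping.split("isoforms/", 1)[1]  # "Q16514-1#PDB_1H3O_tt57tt128"
print(isoform_part.startswith("O00268" + "-"))   # False: this mapping belongs to Q16514, so it is filtered out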
+ def _build_sparql_query_af(uniprot_accs: Iterable[str], limit: int = 10_000) -> str:
+     select_clause = "?protein ?af_db"
+     where_clause = dedent("""
+         # --- Protein Selection ---
+         ?protein a up:Protein .
+
+         # --- AlphaFoldDB Info ---
+         ?protein rdfs:seeAlso ?af_db .
+         ?af_db up:database <http://purl.uniprot.org/database/AlphaFoldDB> .
+     """)
+     return _build_sparql_generic_by_uniprot_accessions_query(uniprot_accs, select_clause, dedent(where_clause), limit)
+
+
+ def _build_sparql_query_emdb(uniprot_accs: Iterable[str], limit: int = 10_000) -> str:
+     select_clause = "?protein ?emdb_db"
+     where_clause = dedent("""
+         # --- Protein Selection ---
+         ?protein a up:Protein .
+
+         # --- EMDB Info ---
+         ?protein rdfs:seeAlso ?emdb_db .
+         ?emdb_db up:database <http://purl.uniprot.org/database/EMDB> .
+     """)
+     return _build_sparql_generic_by_uniprot_accessions_query(uniprot_accs, select_clause, dedent(where_clause), limit)
+
+
+ def _execute_sparql_search(
+     sparql_query: str,
+     timeout: int,
+ ) -> list:
+     """
+     Execute a SPARQL query.
+     """
+     if timeout > 2_700:
+         msg = "UniProt SPARQL timeout is limited to 2700 seconds (45 minutes)."
+         raise ValueError(msg)
+
+     # Execute the query
+     sparql = SPARQLWrapper("https://sparql.uniprot.org/sparql")
+     sparql.setReturnFormat(JSON)
+     sparql.setTimeout(timeout)
+
+     # The default is the GET method, which can be cached by the server and so is preferred.
+     # To prevent URITooLong errors, we use the POST method for large queries.
+     too_long_for_get = 5_000
+     if len(sparql_query) > too_long_for_get:
+         sparql.setMethod("POST")
+
+     sparql.setQuery(sparql_query)
+     rawresults = sparql.queryAndConvert()
+     if not isinstance(rawresults, dict):
+         msg = f"Expected rawresults to be a dict, but got {type(rawresults)}"
+         raise TypeError(msg)
+
+     bindings = rawresults.get("results", {}).get("bindings")
+     if not isinstance(bindings, list):
+         logger.warning("SPARQL query did not return 'bindings' list as expected.")
+         return []
+
+     logger.debug(bindings)
+     return bindings
+
+
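For readers unfamiliar with the SPARQL 1.1 JSON results format: each returned binding is a dict mapping variable names to typed values, which is what the _flatten_results_* helpers below unpack. An illustrative binding (the method IRI is an assumption; the accession, PDB ID, and chain string come from the examples earlier in this module):

binding = {
    "protein": {"type": "uri", "value": "http://purl.uniprot.org/uniprot/O00268"},
    "pdb_db": {"type": "uri", "value": "http://rdf.wwpdb.org/pdb/1H3O"},
    "pdb_method": {"type": "uri", "value": "http://purl.uniprot.org/core/X-Ray_Crystallography"},
    "pdb_chains": {"type": "literal", "value": "B/D=1-81"},
}
# binding["protein"]["value"].split("/")[-1] then yields the accession "O00268".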
+ def _flatten_results_pdb(rawresults: Iterable) -> dict[str, set[PdbResult]]:
+     pdb_entries: dict[str, set[PdbResult]] = {}
+     for result in rawresults:
+         protein = result["protein"]["value"].split("/")[-1]
+         if "pdb_db" not in result:  # Should not happen with _build_sparql_query_pdb
+             continue
+         pdb_id = result["pdb_db"]["value"].split("/")[-1]
+         method = result["pdb_method"]["value"].split("/")[-1]
+         uniprot_chains = result["pdb_chains"]["value"]
+         pdb = PdbResult(
+             id=pdb_id,
+             method=method,
+             uniprot_chains=uniprot_chains,
+             # resolution is OPTIONAL in the query, so it may be absent
+             resolution=result["pdb_resolution"]["value"] if "pdb_resolution" in result else None,
+         )
+         pdb_entries.setdefault(protein, set()).add(pdb)
+
+     return pdb_entries
+
+
+ def _flatten_results_af(rawresults: Iterable) -> dict[str, set[str]]:
+     alphafold_entries: dict[str, set[str]] = {}
+     for result in rawresults:
+         protein = result["protein"]["value"].split("/")[-1]
+         if "af_db" in result:
+             af_id = result["af_db"]["value"].split("/")[-1]
+             alphafold_entries.setdefault(protein, set()).add(af_id)
+     return alphafold_entries
+
+
+ def _flatten_results_emdb(rawresults: Iterable) -> dict[str, set[str]]:
+     emdb_entries: dict[str, set[str]] = {}
+     for result in rawresults:
+         protein = result["protein"]["value"].split("/")[-1]
+         if "emdb_db" in result:
+             emdb_id = result["emdb_db"]["value"].split("/")[-1]
+             emdb_entries.setdefault(protein, set()).add(emdb_id)
+     return emdb_entries
+
+
+ def limit_check(what: str, limit: int, len_raw_results: int) -> None:
+     if len_raw_results >= limit:
+         logger.warning(
+             "%s returned %d results. "
+             "There may be more results available, "
+             "but they are not returned due to the limit of %d. "
+             "Consider increasing the limit to get more results.",
+             what,
+             len_raw_results,
+             limit,
+         )
+
+
+ def search4uniprot(query: Query, limit: int = 10_000, timeout: int = 1_800) -> set[str]:
+     """
+     Search for UniProtKB entries based on the given query.
+
+     Args:
+         query: Query object containing search parameters.
+         limit: Maximum number of results to return.
+         timeout: Timeout for the SPARQL query in seconds.
+
+     Returns:
+         Set of UniProt accessions.
+     """
+     sparql_query = _build_sparql_query_uniprot(query, limit)
+     logger.info("Executing SPARQL query for UniProt: %s", sparql_query)
+
+     raw_results = _execute_sparql_search(
+         sparql_query=sparql_query,
+         timeout=timeout,
+     )
+     limit_check("Search for uniprot accessions", limit, len(raw_results))
+     return {result["protein"]["value"].split("/")[-1] for result in raw_results}
+
+
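A usage sketch tying Query and search4uniprot together; the function is synchronous and returns a plain set, and the taxon and GO term are the same illustrative values as above:

accessions = search4uniprot(
    Query(taxon_id="9606", reviewed=True, subcellular_location_go=["GO:0005634"]),
    limit=100,
)
print(len(accessions))  # at most 100, per the limit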
+ def search4pdb(
+     uniprot_accs: Collection[str], limit: int = 10_000, timeout: int = 1_800, batch_size: int = 10_000
+ ) -> dict[str, set[PdbResult]]:
+     """
+     Search for PDB entries linked to the given UniProtKB accessions.
+
+     Args:
+         uniprot_accs: UniProt accessions.
+         limit: Maximum number of results to return.
+         timeout: Timeout for the SPARQL query in seconds.
+         batch_size: Size of the batches in which the UniProt accessions are processed.
+
+     Returns:
+         Dictionary with protein IDs as keys and sets of PDB results as values.
+     """
+     all_raw_results = []
+     total = len(uniprot_accs)
+     with tqdm(total=total, desc="Searching for PDBs of uniprots", disable=total < batch_size, unit="acc") as pbar:
+         for batch in batched(uniprot_accs, batch_size, strict=False):
+             sparql_query = _build_sparql_query_pdb(batch, limit)
+             logger.info("Executing SPARQL query for PDB: %s", sparql_query)
+
+             raw_results = _execute_sparql_search(
+                 sparql_query=sparql_query,
+                 timeout=timeout,
+             )
+             all_raw_results.extend(raw_results)
+             pbar.update(len(batch))
+
+     limit_check("Search for pdbs on uniprot", limit, len(all_raw_results))
+     return _flatten_results_pdb(all_raw_results)
+
+
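And a sketch of feeding accessions into search4pdb; "O00268" is taken from the comments above, and actual results depend on the live endpoint:

pdbs = search4pdb({"O00268"})
for accession, entries in pdbs.items():
    for entry in entries:
        print(accession, entry.id, entry.method, entry.chain, entry.resolution)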
+ def search4af(
+     uniprot_accs: Collection[str], limit: int = 10_000, timeout: int = 1_800, batch_size: int = 10_000
+ ) -> dict[str, set[str]]:
+     """
+     Search for AlphaFold entries linked to the given UniProtKB accessions.
+
+     Args:
+         uniprot_accs: UniProt accessions.
+         limit: Maximum number of results to return.
+         timeout: Timeout for the SPARQL query in seconds.
+         batch_size: Size of the batches in which the UniProt accessions are processed.
+
+     Returns:
+         Dictionary with protein IDs as keys and sets of AlphaFold IDs as values.
+     """
+     all_raw_results = []
+     total = len(uniprot_accs)
+     with tqdm(total=total, desc="Searching for AlphaFolds of uniprots", disable=total < batch_size, unit="acc") as pbar:
+         for batch in batched(uniprot_accs, batch_size, strict=False):
+             sparql_query = _build_sparql_query_af(batch, limit)
+             logger.info("Executing SPARQL query for AlphaFold: %s", sparql_query)
+
+             raw_results = _execute_sparql_search(
+                 sparql_query=sparql_query,
+                 timeout=timeout,
+             )
+             all_raw_results.extend(raw_results)
+             pbar.update(len(batch))
+
+     limit_check("Search for alphafold entries on uniprot", limit, len(all_raw_results))
+     return _flatten_results_af(all_raw_results)
+
+
+ def search4emdb(uniprot_accs: Iterable[str], limit: int = 10_000, timeout: int = 1_800) -> dict[str, set[str]]:
+     """
+     Search for EMDB entries linked to the given UniProtKB accessions.
+
+     Args:
+         uniprot_accs: UniProt accessions.
+         limit: Maximum number of results to return.
+         timeout: Timeout for the SPARQL query in seconds.
+
+     Returns:
+         Dictionary with protein IDs as keys and sets of EMDB IDs as values.
+     """
+     sparql_query = _build_sparql_query_emdb(uniprot_accs, limit)
+     logger.info("Executing SPARQL query for EMDB: %s", sparql_query)
+
+     raw_results = _execute_sparql_search(
+         sparql_query=sparql_query,
+         timeout=timeout,
+     )
+     limit_check("Search for EMDB entries on uniprot", limit, len(raw_results))
+     return _flatten_results_emdb(raw_results)
protein_quest/utils.py ADDED
@@ -0,0 +1,105 @@
+ """Module for functions that are used in multiple places."""
+
+ import asyncio
+ import logging
+ from collections.abc import Iterable
+ from contextlib import asynccontextmanager
+ from pathlib import Path
+
+ import aiofiles
+ import aiohttp
+ from aiohttp_retry import ExponentialRetry, RetryClient
+ from tqdm.asyncio import tqdm
+
+ logger = logging.getLogger(__name__)
+
+
+ async def retrieve_files(
+     urls: Iterable[tuple[str, str]],
+     save_dir: Path,
+     max_parallel_downloads: int = 5,
+     retries: int = 3,
+     total_timeout: int = 300,
+     desc: str = "Downloading files",
+ ) -> list[Path]:
+     """Retrieve files from a list of URLs and save them to a directory.
+
+     Args:
+         urls: A list of tuples, where each tuple contains a URL and a filename.
+         save_dir: The directory to save the downloaded files to.
+         max_parallel_downloads: The maximum number of files to download in parallel.
+         retries: The number of times to retry a failed download.
+         total_timeout: The total timeout for a download in seconds.
+         desc: Description for the progress bar.
+
+     Returns:
+         A list of paths to the downloaded files.
+     """
+     save_dir.mkdir(parents=True, exist_ok=True)
+     semaphore = asyncio.Semaphore(max_parallel_downloads)
+     async with friendly_session(retries, total_timeout) as session:
+         tasks = [_retrieve_file(session, url, save_dir / filename, semaphore) for url, filename in urls]
+         files: list[Path] = await tqdm.gather(*tasks, desc=desc)
+     return files
+
+
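Being a coroutine, retrieve_files is driven with asyncio.run; a minimal sketch, where the URLs and filenames are placeholders:

# Hypothetical download of two files into ./downloads
urls = [
    ("https://example.com/a.pdb", "a.pdb"),
    ("https://example.com/b.pdb", "b.pdb"),
]
paths = asyncio.run(retrieve_files(urls, Path("downloads")))
print(paths)  # e.g. [PosixPath('downloads/a.pdb'), PosixPath('downloads/b.pdb')] on POSIX systems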
+ async def _retrieve_file(
+     session: RetryClient,
+     url: str,
+     save_path: Path,
+     semaphore: asyncio.Semaphore,
+     overwrite: bool = False,
+     chunk_size: int = 131072,  # 128 KiB
+ ) -> Path:
+     """Retrieve a single file from a URL and save it to a specified path.
+
+     Args:
+         session: The aiohttp session to use for the request.
+         url: The URL to download the file from.
+         save_path: The path where the file should be saved.
+         semaphore: A semaphore to limit the number of concurrent downloads.
+         overwrite: Whether to overwrite the file if it already exists.
+         chunk_size: The size of each chunk to read from the response.
+
+     Returns:
+         The path to the saved file.
+     """
+     if save_path.exists():
+         if overwrite:
+             save_path.unlink()
+         else:
+             logger.debug(f"File {save_path} already exists. Skipping download from {url}.")
+             return save_path
+     async with (
+         semaphore,
+         aiofiles.open(save_path, "xb") as f,
+         session.get(url) as resp,
+     ):
+         resp.raise_for_status()
+         async for chunk in resp.content.iter_chunked(chunk_size):
+             await f.write(chunk)
+     return save_path
+
+
+ @asynccontextmanager
+ async def friendly_session(retries: int = 3, total_timeout: int = 300):
+     """Create an aiohttp session with retry capabilities.
+
+     Examples:
+         Use as an async context manager:
+
+         >>> async with friendly_session(retries=5, total_timeout=60) as session:
+         ...     r = await session.get("https://example.com/api/data")
+         ...     print(r)
+         <ClientResponse(https://example.com/api/data) [404 Not Found]>
+         <CIMultiDictProxy('Accept-Ranges': 'bytes', ...
+
+     Args:
+         retries: The number of retry attempts for failed requests.
+         total_timeout: The total timeout for a request in seconds.
+     """
+     retry_options = ExponentialRetry(attempts=retries)
+     timeout = aiohttp.ClientTimeout(total=total_timeout)  # pyrefly: ignore false positive
+     async with aiohttp.ClientSession(timeout=timeout) as session:
+         client = RetryClient(client_session=session, retry_options=retry_options)
+         yield client