PyPI - nv-ingest-api - Versions diffs - 2025.4.17.dev20250417__py3-none-any.whl → 2025.4.18.dev20250418__py3-none-any.whl - Mend - Supply Chain Defender

nv-ingest-api 2025.4.17.dev20250417-py3-none-any.whl → 2025.4.18.dev20250418-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of nv-ingest-api might be problematic. Click here for more details.

Files changed (9) hide show

nv_ingest_api/util/service_clients/rest/rest_client.py CHANGED Viewed

@@ -2,14 +2,12 @@
 # All rights reserved.
 # SPDX-License-Identifier: Apache-2.0
-# pylint: skip-file
 import logging
 import re
 import time
-from typing import Any
+from typing import Any, Union, Tuple, Optional, Dict, Callable
+from urllib.parse import urlparse
-import httpx
 import requests
 from nv_ingest_api.internal.schemas.message_brokers.response_schema import ResponseSchema
@@ -64,28 +62,11 @@ _TERMINAL_RESPONSE_STATUSES = [
 class RestClient(MessageBrokerClientBase):
     """
-    A client for interfacing with the nv-ingest HTTP endpoint, providing mechanisms for sending and receiving messages
-    with retry logic and connection management.
-    Parameters
-    ----------
-    host : str
-        The hostname of the HTTP server.
-    port : int
-        The port number of the HTTP server.
-    max_retries : int, optional
-        The maximum number of retry attempts for operations. Default is 0 (no retries).
-    max_backoff : int, optional
-        The maximum backoff delay between retries in seconds. Default is 32 seconds.
-    connection_timeout : int, optional
-        The timeout in seconds for connecting to the HTTP server. Default is 300 seconds.
-    http_allocator : Any, optional
-        The HTTP client allocator.
-    Attributes
-    ----------
-    client : Any
-        The HTTP client instance used for operations.
+    A client for interfacing with an HTTP endpoint (e.g., nv-ingest), providing mechanisms for sending
+    and receiving messages with retry logic using the `requests` library by default, but allowing a custom
+    HTTP client allocator.
+    Extends MessageBrokerClientBase for interface compatibility.
     """
     def __init__(
@@ -94,305 +75,457 @@ class RestClient(MessageBrokerClientBase):
         port: int,
         max_retries: int = 0,
         max_backoff: int = 32,
-        connection_timeout: int = 300,
-        http_allocator: Any = httpx.AsyncClient,
+        default_connect_timeout: float = 300.0,
+        default_read_timeout: Optional[float] = None,
+        http_allocator: Optional[Callable[[], Any]] = None,
         **kwargs,
-    ):
-        self._host = host
-        self._port = port
-        self._max_retries = max_retries
-        self._max_backoff = max_backoff
-        self._connection_timeout = connection_timeout
-        self._http_allocator = http_allocator
-        self._client = self._http_allocator()
-        self._retries = 0
-        self._submit_endpoint = "/v1/submit_job"
-        self._fetch_endpoint = "/v1/fetch_job"
-        if "base_url" in kwargs:
-            logger.debug("Using custom base_url; ignoring host and port")
-        self._base_url = kwargs.get("base_url") or self.generate_url(self._host, self._port)
+    ) -> None:
+        """
+        Initializes the RestClient.
+        By default, uses `requests.Session`. If `http_allocator` is provided, it will be called to instantiate
+        the client. If a custom allocator is used, the internal methods (`fetch_message`, `submit_message`)
+        might need adjustments if the allocated client's API differs significantly from `requests.Session`.
+        Parameters
+        ----------
+        host : str
+            The hostname or IP address of the HTTP server.
+        port : int
+            The port number of the HTTP server.
+        max_retries : int, optional
+            Maximum number of retry attempts for connection errors or specific retryable HTTP statuses. Default is 0.
+        max_backoff : int, optional
+            Maximum backoff delay between retries, in seconds. Default is 32.
+        default_connect_timeout : float, optional
+            Default timeout in seconds for establishing a connection. Default is 300.0.
+        default_read_timeout : float, optional
+            Default timeout in seconds for waiting for data after connection. Default is None.
+        http_allocator : Optional[Callable[[], Any]], optional
+            A callable that returns an HTTP client instance. If None, `requests.Session()` is used.
+        Returns
+        -------
+        None
+        """
+        self._host: str = host
+        self._port: int = port
+        self._max_retries: int = max_retries
+        self._max_backoff: int = max_backoff
+        self._default_connect_timeout: float = default_connect_timeout
+        self._default_read_timeout: Optional[float] = default_read_timeout
+        self._http_allocator: Optional[Callable[[], Any]] = http_allocator
+        self._timeout: Tuple[float, Optional[float]] = (self._default_connect_timeout, default_read_timeout)
+        if self._http_allocator is None:
+            self._client: Any = requests.Session()
+            logger.debug("RestClient initialized using default requests.Session.")
+        else:
+            try:
+                self._client = self._http_allocator()
+                logger.debug(f"RestClient initialized using provided http_allocator: {self._http_allocator.__name__}")
+                if not isinstance(self._client, requests.Session):
+                    logger.warning(
+                        "Provided http_allocator does not create a requests.Session. "
+                        "Internal HTTP calls may fail if the client API is incompatible."
+                    )
+            except Exception as e:
+                logger.exception(
+                    f"Failed to instantiate client using provided http_allocator: {e}. "
+                    f"Falling back to requests.Session."
+                )
+                self._client = requests.Session()
+        self._submit_endpoint: str = "/v1/submit_job"
+        self._fetch_endpoint: str = "/v1/fetch_job"
+        self._base_url: str = kwargs.get("base_url") or self._generate_url(self._host, self._port)
         self._headers = kwargs.get("headers", {})
         self._auth = kwargs.get("auth", None)
-    def _connect(self) -> None:
+        logger.debug(f"RestClient base URL set to: {self._base_url}")
+    @staticmethod
+    def _generate_url(host: str, port: int) -> str:
         """
-        Attempts to reconnect to the HTTP server if the current connection is not responsive.
+        Constructs a base URL from host and port, intelligently handling schemes and existing ports.
+        Parameters
+        ----------
+        host : str
+            Hostname, IP address, or full URL (e.g., "localhost", "192.168.1.100",
+            "http://example.com", "https://api.example.com:8443/v1").
+        port : int
+            The default port number to use if the host string does not explicitly specify one.
+        Returns
+        -------
+        str
+            A fully constructed base URL string, including scheme, hostname, port,
+            and any original path, without a trailing slash.
+        Raises
+        ------
+        ValueError
+            If the host string appears to be a URL but lacks a valid hostname.
         """
-        ping_result = self.ping()
+        url_str: str = str(host).strip()
+        scheme: str = "http"
+        parsed_path: Optional[str] = None
+        effective_port: int = port
+        hostname: Optional[str] = None
+        if re.match(r"^https?://", url_str, re.IGNORECASE):
+            parsed_url = urlparse(url_str)
+            hostname = parsed_url.hostname
+            if hostname is None:
+                raise ValueError(f"Invalid URL provided in host string: '{url_str}'. Could not parse a valid hostname.")
+            scheme = parsed_url.scheme
+            if parsed_url.port is not None:
+                effective_port = parsed_url.port
+            else:
+                effective_port = port
+            if parsed_url.path and parsed_url.path.strip("/"):
+                parsed_path = parsed_url.path
+        else:
+            hostname = url_str
+            effective_port = port
+        if not hostname:
+            raise ValueError(f"Could not determine a valid hostname from input: '{host}'")
+        base_url: str = f"{scheme}://{hostname}:{effective_port}"
+        if parsed_path:
+            if not parsed_path.startswith("/"):
+                parsed_path = "/" + parsed_path
+            base_url += parsed_path
-        if ping_result.response_code != 0:
-            logger.debug("Reconnecting to HTTP server")
-            self._client = self._http_allocator()
+        final_url: str = base_url.rstrip("/")
+        logger.debug(f"Generated base URL: {final_url}")
+        return final_url
     @property
     def max_retries(self) -> int:
+        """
+        Maximum number of retry attempts configured for operations.
+        Returns
+        -------
+        int
+            The maximum number of retries.
+        """
         return self._max_retries
     @max_retries.setter
     def max_retries(self, value: int) -> None:
+        """
+        Sets the maximum number of retry attempts.
+        Parameters
+        ----------
+        value : int
+            The new maximum number of retries. Must be a non-negative integer.
+        Raises
+        ------
+        ValueError
+            If value is not a non-negative integer.
+        """
+        if not isinstance(value, int) or value < 0:
+            raise ValueError("max_retries must be a non-negative integer.")
         self._max_retries = value
     def get_client(self) -> Any:
         """
-        Returns a HTTP client instance, reconnecting if necessary.
+        Returns the underlying HTTP client instance.
         Returns
         -------
         Any
-            The HTTP client instance.
+            The active HTTP client instance.
         """
-        if self._client is None:
-            self._connect()
         return self._client
-    def ping(self) -> ResponseSchema:
+    def ping(self) -> "ResponseSchema":
         """
-        Checks if the HTTP server is responsive.
+        Checks if the HTTP server endpoint is responsive using an HTTP GET request.
         Returns
         -------
-        bool
-            True if the server responds to a ping, False otherwise.
+        ResponseSchema
+            An object encapsulating the outcome:
+            - response_code = 0 indicates success (HTTP status code < 400).
+            - response_code = 1 indicates failure, with details in response_reason.
         """
+        ping_timeout: Tuple[float, float] = (min(self._default_connect_timeout, 5.0), 10.0)
+        logger.debug(f"Attempting to ping server at {self._base_url} with timeout {ping_timeout}")
         try:
-            # Implement a simple GET request to a health endpoint or root
-            self._client.ping()
-            return ResponseSchema(response_code=0)
-        except (httpx.HTTPError, AttributeError):
-            return ResponseSchema(response_code=1, response_reason="Failed to ping HTTP server")
-    @staticmethod
-    def generate_url(user_provided_url, user_provided_port) -> str:
-        """Examines the user defined URL for http*://. If that
-        pattern is detected the URL is used as provided by the user.
-        If that pattern does not exist then the assumption is made that
-        the endpoint is simply `http://` and that is prepended
-        to the user supplied endpoint.
-        Args:
-            user_provided_url str: Endpoint where the Rest service is running
-        Returns:
-            str: Fully validated URL
+            if isinstance(self._client, requests.Session):
+                response: requests.Response = self._client.get(self._base_url, timeout=ping_timeout)
+                response.raise_for_status()
+                logger.debug(f"Ping successful to {self._base_url} (Status: {response.status_code})")
+                return ResponseSchema(response_code=0, response_reason="Ping OK")
+        except requests.exceptions.RequestException as e:
+            error_reason: str = f"Ping failed due to RequestException for {self._base_url}: {e}"
+            logger.warning(error_reason)
+            return ResponseSchema(response_code=1, response_reason=error_reason)
+        except Exception as e:
+            error_reason: str = f"Unexpected error during ping to {self._base_url}: {e}"
+            logger.exception(error_reason)
+            return ResponseSchema(response_code=1, response_reason=error_reason)
+    def fetch_message(
+        self, job_id: str, timeout: Optional[Union[float, Tuple[float, float]]] = None
+    ) -> "ResponseSchema":
         """
-        if not re.match(r"^https?://", user_provided_url):
-            # Add the default `http://` if it's not already present in the URL
-            user_provided_url = f"http://{user_provided_url}:{user_provided_port}"
-        else:
-            user_provided_url = f"{user_provided_url}:{user_provided_port}"
-        return user_provided_url
+        Fetches a job result message from the server's fetch endpoint.
-    def fetch_message(self, job_id: str, timeout: float = (10, 600)) -> ResponseSchema:
-        """
-        Fetches a message from the specified queue with retries on failure, handling streaming HTTP responses.
+        Handles retries for connection errors and non-terminal HTTP errors based on the max_retries configuration.
+        Specific HTTP statuses are treated as immediate failures (terminal) or as job not ready (HTTP 202).
         Parameters
         ----------
         job_id : str
-            The server-side job identifier.
-        timeout : float
-            The timeout in seconds for blocking until a message is available.
+            The server-assigned identifier of the job to fetch.
+        timeout : float or tuple of float, optional
+            Specific timeout override for this request.
         Returns
         -------
         ResponseSchema
-            The fetched message wrapped in a ResponseSchema object.
-        """
-        retries = 0
-        url = f"{self._base_url}{self._fetch_endpoint}/{job_id}"
+            - response_code = 0: Success (HTTP 200) with the job result.
+            - response_code = 1: Terminal failure (e.g., 404, 400, 5xx, or max retries exceeded).
+            - response_code = 2: Job not ready (HTTP 202).
+        Raises
+        ------
+        TypeError
+            If the configured client does not support the required HTTP GET method.
+        """
         # Ensure headers are included
         headers = {"Content-Type": "application/json"}
         headers.update(self._headers)
-        while True:
-            try:
-                logger.debug(f"Invoking fetch_message http endpoint @ '{url}'")
-                # Fetch using streaming response
-                with requests.get(
-                    url,
-                    timeout=(30, 600),
-                    stream=True,
-                    headers=headers,
-                    auth=self._auth,
-                ) as result:
-                    response_code = result.status_code
-                    if response_code in _TERMINAL_RESPONSE_STATUSES:
-                        # Terminal response code; return error ResponseSchema
-                        return ResponseSchema(
-                            response_code=1,
-                            response_reason=(
-                                f"Terminal response code {response_code} received when fetching JobSpec: {job_id}"
-                            ),
-                            response=result.text,
-                        )
-                    if response_code == 200:
-                        # Handle streaming response, reconstructing payload incrementally
-                        response_chunks = []
-                        for chunk in result.iter_content(chunk_size=1024 * 1024):  # 1MB chunks
-                            if chunk:
-                                response_chunks.append(chunk)
-                        full_response = b"".join(response_chunks).decode("utf-8")
+        retries: int = 0
+        url: str = f"{self._base_url}{self._fetch_endpoint}/{job_id}"
+        req_timeout: Tuple[float, Optional[float]] = self._timeout
-                        return ResponseSchema(
-                            response_code=0,
-                            response_reason="OK",
-                            response=full_response,
-                        )
-                    elif response_code == 202:
-                        # Job is not ready yet
-                        return ResponseSchema(
-                            response_code=1,
-                            response_reason="Job is not ready yet. Retry later.",
-                        )
+        while True:
+            result: Optional[Any] = None
+            trace_id: Optional[str] = None
+            response_code: int = -1
-                    else:
-                        try:
-                            # Retry the operation
-                            retries = self.perform_retry_backoff(retries)
-                        except RuntimeError as rte:
-                            raise rte
-            except (ConnectionError, requests.HTTPError, requests.exceptions.ConnectionError) as err:
-                logger.error(f"Error during fetching, retrying... Error: {err}")
-                self._client = None  # Invalidate client to force reconnection
-                if "Connection refused" in str(err):
-                    logger.debug(
-                        "Connection refused encountered during fetch; sleeping for 10 seconds before retrying."
+            try:
+                if isinstance(self._client, requests.Session):
+                    with self._client.get(
+                        url, timeout=req_timeout, headers=headers, stream=True, auth=self._auth
+                    ) as result:
+                        response_code = result.status_code
+                        response_text = result.text
+                        if response_code in _TERMINAL_RESPONSE_STATUSES:
+                            error_reason: str = f"Terminal response code {response_code} fetching {job_id}."
+                            logger.error(f"{error_reason} Response: {response_text[:200]}")
+                            return ResponseSchema(
+                                response_code=1, response_reason=error_reason, response=response_text, trace_id=trace_id
+                            )
+                        elif response_code == 200:
+                            try:
+                                full_response: str = b"".join(c for c in result.iter_content(1024 * 1024) if c).decode(
+                                    "utf-8"
+                                )
+                                return ResponseSchema(
+                                    response_code=0, response_reason="OK", response=full_response, trace_id=trace_id
+                                )
+                            except Exception as e:
+                                logger.error(f"Stream processing error for {job_id}: {e}")
+                                return ResponseSchema(
+                                    response_code=1, response_reason=f"Stream processing error: {e}", trace_id=trace_id
+                                )
+                        elif response_code == 202:
+                            logger.debug(f"Job {job_id} not ready (202)")
+                            return ResponseSchema(
+                                response_code=2, response_reason="Job not ready yet. Retry later.", trace_id=trace_id
+                            )
+                        else:
+                            logger.warning(f"Unexpected status {response_code} for {job_id}. Retrying if possible.")
+                else:
+                    raise TypeError(
+                        f"Unsupported client type for fetch_message: {type(self._client)}. "
+                        f"Requires a requests.Session compatible API."
                     )
-                    time.sleep(10)
+            except requests.exceptions.RequestException as err:
+                logger.debug(
+                    f"RequestException fetching {job_id}: {err}. "
+                    f"Attempting retry ({retries + 1}/{self._max_retries})..."
+                )
                 try:
                     retries = self.perform_retry_backoff(retries)
+                    continue
                 except RuntimeError as rte:
-                    # Max retries reached
+                    logger.error(f"Max retries hit fetching {job_id} after RequestException: {rte}")
                     return ResponseSchema(response_code=1, response_reason=str(rte), response=str(err))
-                except TimeoutError:
-                    raise
             except Exception as e:
-                # Handle non-http specific exceptions
-                logger.error(f"Unexpected error during fetch from {url}: {e}")
+                logger.exception(f"Unexpected error fetching {job_id}: {e}")
+                return ResponseSchema(response_code=1, response_reason=f"Unexpected fetch error: {e}")
+            try:
+                retries = self.perform_retry_backoff(retries)
+                continue
+            except RuntimeError as rte:
+                logger.error(f"Max retries hit fetching {job_id} after HTTP {response_code}: {rte}")
+                resp_text_snippet: Optional[str] = response_text[:500] if "response_text" in locals() else None
                 return ResponseSchema(
-                    response_code=1, response_reason=f"Unexpected error during fetch: {e}", response=None
+                    response_code=1,
+                    response_reason=f"Max retries after HTTP {response_code}: {rte}",
+                    response=resp_text_snippet,
+                    trace_id=trace_id,
                 )
-    def submit_message(self, channel_name: str, message: str, for_nv_ingest: bool = False) -> ResponseSchema:
+    def submit_message(
+        self,
+        channel_name: str,
+        message: str,
+        for_nv_ingest: bool = False,
+        timeout: Optional[Union[float, Tuple[float, float]]] = None,
+    ) -> "ResponseSchema":
         """
-        Submits a JobSpec to a specified HTTP endpoint with retries on failure.
+        Submits a job message payload to the server's submit endpoint.
+        Handles retries for connection errors and non-terminal HTTP errors based on the max_retries configuration.
+        Specific HTTP statuses are treated as immediate failures.
         Parameters
         ----------
         channel_name : str
-            Not used as part of RestClient but defined in MessageClientBase.
+            Not used by RestClient; included for interface compatibility.
         message : str
-            The message to submit.
-        for_nv_ingest : bool
-            Not used as part of RestClient but defined in MessageClientBase.
+            The JSON string representing the job specification payload.
+        for_nv_ingest : bool, optional
+            Not used by RestClient. Default is False.
+        timeout : float or tuple of float, optional
+            Specific timeout override for this request.
         Returns
         -------
         ResponseSchema
-            The response from the server wrapped in a ResponseSchema object.
+            - response_code = 0: Success (HTTP 200) with a successful job submission.
+            - response_code = 1: Terminal failure (e.g., 422, 400, 5xx, or max retries exceeded).
+        Raises
+        ------
+        TypeError
+            If the configured client does not support the required HTTP POST method.
         """
-        retries = 0
-        url = f"{self._base_url}{self._submit_endpoint}"
+        retries: int = 0
+        url: str = f"{self._base_url}{self._submit_endpoint}"
+        headers: Dict[str, str] = {"Content-Type": "application/json"}
+        request_payload: Dict[str, str] = {"payload": message}
+        req_timeout: Tuple[float, Optional[float]] = self._timeout
         # Ensure content-type is present
         headers = {"Content-Type": "application/json"}
         headers.update(self._headers)
         while True:
-            try:
-                # Submit via HTTP
-                result = requests.post(
-                    url,
-                    json={"payload": message},
-                    headers=headers,
-                    auth=self._auth,
-                    timeout=self._connection_timeout,
-                )
+            result: Optional[Any] = None
+            trace_id: Optional[str] = None
+            response_code: int = -1
-                response_code = result.status_code
-                if response_code in _TERMINAL_RESPONSE_STATUSES:
-                    # Terminal response code; return error ResponseSchema
-                    return ResponseSchema(
-                        response_code=1,
-                        response_reason=f"Terminal response code {response_code} received when submitting JobSpec",
-                        trace_id=result.headers.get("x-trace-id"),
+            try:
+                if isinstance(self._client, requests.Session):
+                    result = self._client.post(
+                        url,
+                        json=request_payload,
+                        headers=headers,
+                        auth=self._auth,
+                        timeout=req_timeout,
                     )
-                else:
-                    # If 200 we are good, otherwise let's try again
-                    if response_code == 200:
-                        logger.debug(f"JobSpec successfully submitted to http endpoint {self._submit_endpoint}")
-                        # The REST interface returns a JobId, so we capture that here
-                        x_trace_id = result.headers.get("x-trace-id")
+                    response_code = result.status_code
+                    trace_id = result.headers.get("x-trace-id")
+                    response_text: str = result.text
+                    if response_code in _TERMINAL_RESPONSE_STATUSES:
+                        error_reason: str = f"Terminal response code {response_code} submitting job."
+                        logger.error(f"{error_reason} Response: {response_text[:200]}")
+                        return ResponseSchema(
+                            response_code=1, response_reason=error_reason, response=response_text, trace_id=trace_id
+                        )
+                    elif response_code == 200:
+                        server_job_id_raw: str = response_text
+                        cleaned_job_id: str = server_job_id_raw.strip('"')
+                        logger.debug(f"Submit successful. Server Job ID: {cleaned_job_id}, Trace: {trace_id}")
                         return ResponseSchema(
                             response_code=0,
                             response_reason="OK",
-                            response=result.text,
-                            transaction_id=result.text,
-                            trace_id=x_trace_id,
+                            response=server_job_id_raw,
+                            transaction_id=cleaned_job_id,
+                            trace_id=trace_id,
                         )
                     else:
-                        # Retry the operation
-                        retries = self.perform_retry_backoff(retries)
-            except requests.RequestException as e:
-                logger.error(f"Failed to submit job, retrying... Error: {e}")
-                self._client = None  # Invalidate client to force reconnection
-                if "Connection refused" in str(e):
-                    logger.debug(
-                        "Connection refused encountered during submission; sleeping for 10 seconds before retrying."
+                        logger.warning(f"Unexpected status {response_code} on submit. Retrying if possible.")
+                else:
+                    raise TypeError(
+                        f"Unsupported client type for submit_message: {type(self._client)}. "
+                        f"Requires a requests.Session compatible API."
                     )
-                    time.sleep(10)
+            except requests.exceptions.RequestException as err:
+                logger.warning(
+                    f"RequestException submitting job: {err}. Attempting retry ({retries + 1}/{self._max_retries})..."
+                )
                 try:
                     retries = self.perform_retry_backoff(retries)
+                    continue
                 except RuntimeError as rte:
-                    # Max retries reached
-                    return ResponseSchema(response_code=1, response_reason=str(rte), response=str(e))
+                    logger.error(f"Max retries hit submitting job after RequestException: {rte}")
+                    return ResponseSchema(response_code=1, response_reason=str(rte), response=str(err))
             except Exception as e:
-                # Handle non-http specific exceptions
-                logger.error(f"Unexpected error during submission of JobSpec to {url}: {e}")
+                logger.exception(f"Unexpected error submitting job: {e}")
+                return ResponseSchema(response_code=1, response_reason=f"Unexpected submit error: {e}")
+            try:
+                retries = self.perform_retry_backoff(retries)
+                continue
+            except RuntimeError as rte:
+                logger.error(f"Max retries hit submitting job after HTTP {response_code}: {rte}")
+                resp_text_snippet: Optional[str] = response_text[:500] if "response_text" in locals() else None
                 return ResponseSchema(
-                    response_code=1, response_reason=f"Unexpected error during JobSpec submission: {e}", response=None
+                    response_code=1,
+                    response_reason=f"Max retries after HTTP {response_code}: {rte}",
+                    response=resp_text_snippet,
+                    trace_id=trace_id,
                 )
-    def perform_retry_backoff(self, existing_retries) -> int:
+    def perform_retry_backoff(self, existing_retries: int) -> int:
         """
-        Attempts to perform a backoff retry delay. This function accepts the
-        current number of retries that have been attempted and compares
-        that with the maximum number of retries allowed. If the current
-        number of retries exceeds the max then a RuntimeError is raised.
+        Performs exponential backoff sleep if retries are permitted.
+        Calculates the delay using exponential backoff (2^existing_retries) capped by self._max_backoff.
+        Sleeps for the calculated delay if the number of existing_retries is less than max_retries.
         Parameters
         ----------
         existing_retries : int
-            The number of retries that have been attempted for this operation thus far
+            The number of retries already attempted for the current operation.
         Returns
         -------
         int
-            The updated number of retry attempts that have been made for this operation
+            The incremented retry count (existing_retries + 1).
         Raises
         ------
         RuntimeError
-            Raised if the maximum number of retry attempts has been reached.
+            If existing_retries is greater than or equal to max_retries (when max_retries > 0).
         """
-        backoff_delay = min(2**existing_retries, self._max_backoff)
+        if self._max_retries > 0 and existing_retries >= self._max_retries:
+            raise RuntimeError(f"Max retry attempts ({self._max_retries}) reached")
+        backoff_delay: int = min(2**existing_retries, self._max_backoff)
+        retry_attempt_num: int = existing_retries + 1
         logger.debug(
-            f"Retry #: {existing_retries} of max_retries: {self.max_retries} | "
-            f"current backoff_delay: {backoff_delay}s of max_backoff: {self._max_backoff}s"
+            f"Operation failed. Retrying attempt "
+            f"{retry_attempt_num}/{self._max_retries if self._max_retries > 0 else 'infinite'} "
+            f"in {backoff_delay:.2f}s..."
         )
-        if self.max_retries > 0 and existing_retries < self.max_retries:
-            logger.error(f"Operation failed, retrying in {backoff_delay}s...")
-            time.sleep(backoff_delay)
-            return existing_retries + 1
-        else:
-            raise RuntimeError(f"Max retry attempts of {self.max_retries} reached")
+        time.sleep(backoff_delay)
+        return retry_attempt_num