PyPI - rasa-pro - Versions diffs - 3.14.0rc4__py3-none-any.whl → 3.14.2__py3-none-any.whl - Mend

rasa-pro 3.14.0rc4__py3-none-any.whl → 3.14.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of rasa-pro might be problematic. Click here for more details.

Files changed (79)

rasa/agents/agent_manager.py +7 -5
rasa/agents/protocol/a2a/a2a_agent.py +13 -11
rasa/agents/protocol/mcp/mcp_base_agent.py +49 -11
rasa/agents/validation.py +4 -2
rasa/builder/copilot/copilot_templated_message_provider.py +1 -1
rasa/builder/validation_service.py +4 -0
rasa/cli/arguments/data.py +9 -0
rasa/cli/data.py +72 -6
rasa/cli/interactive.py +3 -0
rasa/cli/llm_fine_tuning.py +1 -0
rasa/cli/project_templates/defaults.py +1 -0
rasa/cli/validation/bot_config.py +2 -0
rasa/constants.py +2 -1
rasa/core/actions/action_clean_stack.py +32 -0
rasa/core/actions/action_exceptions.py +1 -1
rasa/core/actions/constants.py +4 -0
rasa/core/actions/custom_action_executor.py +70 -12
rasa/core/actions/grpc_custom_action_executor.py +41 -2
rasa/core/actions/http_custom_action_executor.py +49 -25
rasa/core/agent.py +4 -1
rasa/core/available_agents.py +1 -1
rasa/core/channels/voice_stream/browser_audio.py +3 -3
rasa/core/channels/voice_stream/voice_channel.py +27 -17
rasa/core/config/credentials.py +3 -3
rasa/core/exceptions.py +1 -1
rasa/core/featurizers/tracker_featurizers.py +3 -2
rasa/core/persistor.py +7 -7
rasa/core/policies/flows/agent_executor.py +84 -4
rasa/core/policies/flows/flow_exceptions.py +5 -2
rasa/core/policies/flows/flow_executor.py +52 -31
rasa/core/policies/flows/mcp_tool_executor.py +7 -1
rasa/core/policies/rule_policy.py +1 -1
rasa/core/run.py +21 -5
rasa/dialogue_understanding/commands/cancel_flow_command.py +1 -1
rasa/dialogue_understanding/generator/llm_based_command_generator.py +6 -3
rasa/dialogue_understanding/generator/single_step/compact_llm_command_generator.py +15 -7
rasa/dialogue_understanding/generator/single_step/search_ready_llm_command_generator.py +15 -8
rasa/dialogue_understanding/patterns/default_flows_for_patterns.yml +1 -1
rasa/dialogue_understanding/processor/command_processor.py +13 -7
rasa/e2e_test/e2e_config.py +4 -3
rasa/engine/recipes/default_components.py +16 -6
rasa/graph_components/validators/default_recipe_validator.py +10 -4
rasa/model_manager/runner_service.py +1 -1
rasa/nlu/classifiers/diet_classifier.py +2 -0
rasa/privacy/privacy_config.py +1 -1
rasa/shared/agents/auth/auth_strategy/oauth2_auth_strategy.py +4 -7
rasa/shared/core/flows/flow.py +8 -2
rasa/shared/core/slots.py +55 -24
rasa/shared/core/training_data/story_reader/story_reader.py +1 -1
rasa/shared/exceptions.py +23 -2
rasa/shared/providers/_configs/azure_openai_client_config.py +4 -5
rasa/shared/providers/_configs/default_litellm_client_config.py +4 -4
rasa/shared/providers/_configs/litellm_router_client_config.py +3 -2
rasa/shared/providers/_configs/openai_client_config.py +5 -7
rasa/shared/providers/_configs/rasa_llm_client_config.py +4 -4
rasa/shared/providers/_configs/self_hosted_llm_client_config.py +4 -4
rasa/shared/providers/llm/_base_litellm_client.py +42 -14
rasa/shared/providers/llm/litellm_router_llm_client.py +40 -17
rasa/shared/providers/llm/self_hosted_llm_client.py +34 -32
rasa/shared/utils/common.py +9 -1
rasa/shared/utils/configs.py +5 -8
rasa/shared/utils/llm.py +21 -4
rasa/shared/utils/mcp/server_connection.py +7 -4
rasa/studio/download.py +3 -0
rasa/studio/prompts.py +1 -0
rasa/studio/upload.py +4 -0
rasa/utils/common.py +9 -0
rasa/utils/endpoints.py +6 -0
rasa/utils/installation_utils.py +111 -0
rasa/utils/log_utils.py +20 -1
rasa/utils/tensorflow/callback.py +2 -0
rasa/utils/tensorflow/models.py +3 -0
rasa/utils/train_utils.py +2 -0
rasa/version.py +1 -1
{rasa_pro-3.14.0rc4.dist-info → rasa_pro-3.14.2.dist-info}/METADATA +3 -3
{rasa_pro-3.14.0rc4.dist-info → rasa_pro-3.14.2.dist-info}/RECORD +79 -78
{rasa_pro-3.14.0rc4.dist-info → rasa_pro-3.14.2.dist-info}/NOTICE +0 -0
{rasa_pro-3.14.0rc4.dist-info → rasa_pro-3.14.2.dist-info}/WHEEL +0 -0
{rasa_pro-3.14.0rc4.dist-info → rasa_pro-3.14.2.dist-info}/entry_points.txt +0 -0

rasa/model_manager/runner_service.py CHANGED Viewed

@@ -195,7 +195,7 @@ def fetch_remote_model_to_dir(
     try:
         return persistor.retrieve(model_name=model_name, target_path=target_path)
     except FileNotFoundError as e:
-        raise ModelNotFound() from e
+        raise ModelNotFound("Model not found") from e
 def fetch_size_of_remote_model(

rasa/nlu/classifiers/diet_classifier.py CHANGED Viewed

@@ -9,9 +9,11 @@ from typing import Any, Dict, List, Optional, Text, Tuple, Type, TypeVar, Union
 import numpy as np
 import scipy.sparse
+from rasa.utils.installation_utils import check_for_installation_issues
 from rasa.utils.tensorflow import TENSORFLOW_AVAILABLE
 if TENSORFLOW_AVAILABLE:
+    check_for_installation_issues()
     import tensorflow as tf
 else:
     tf = None

rasa/privacy/privacy_config.py CHANGED Viewed

@@ -211,7 +211,7 @@ def get_cron_trigger(cron_expression: str) -> CronTrigger:
             "privacy_config.invalid_cron_expression",
             cron=cron_expression,
         )
-        raise RasaException from exc
+        raise RasaException("Invalid cron expression") from exc
     return cron

rasa/shared/agents/auth/auth_strategy/oauth2_auth_strategy.py CHANGED Viewed

@@ -139,20 +139,17 @@ class OAuth2AuthStrategy(AgentAuthStrategy):
                 resp.raise_for_status()
                 token_data = resp.json()
         except httpx.HTTPStatusError as e:
-            raise ValueError(
-                f"OAuth2 token request failed with status {e.response.status_code}: "
-                f"{e.response.text}"
-            ) from e
+            raise e
         except httpx.RequestError as e:
-            raise ValueError(f"OAuth2 token request failed: {e}") from e
+            raise ValueError(f"OAuth2 token request failed - {e}") from e
         except Exception as e:
             raise ValueError(
-                f"Unexpected error during OAuth2 token request: {e}"
+                f"Unexpected error during OAuth2 token request - {e}"
             ) from e
         # Validate token data
         if KEY_ACCESS_TOKEN not in token_data:
-            raise ValueError(f"No {KEY_ACCESS_TOKEN} in OAuth2 response")
+            raise ValueError(f"No `{KEY_ACCESS_TOKEN}` in OAuth2 response")
         # Set access token and expires at
         self._access_token = token_data[KEY_ACCESS_TOKEN]

rasa/shared/core/flows/flow.py CHANGED Viewed

@@ -322,9 +322,15 @@ class Flow:
     def get_collect_steps(self) -> List[CollectInformationFlowStep]:
         """Return all CollectInformationFlowSteps in the flow."""
-        collect_steps = []
+        collect_steps: List[CollectInformationFlowStep] = []
         for step in self.steps_with_calls_resolved:
-            if isinstance(step, CollectInformationFlowStep):
+            # Only add collect steps that are not already in the list.
+            # This is to avoid returning duplicate collect steps from called flows
+            # in case the called flow is called multiple times.
+            if (
+                isinstance(step, CollectInformationFlowStep)
+                and step not in collect_steps
+            ):
                 collect_steps.append(step)
         return collect_steps

rasa/shared/core/slots.py CHANGED Viewed

@@ -355,8 +355,8 @@ class FloatSlot(Slot):
         mappings: List[Dict[Text, Any]],
         initial_value: Optional[float] = None,
         value_reset_delay: Optional[int] = None,
-        max_value: float = 1.0,
-        min_value: float = 0.0,
+        max_value: Optional[float] = None,
+        min_value: Optional[float] = None,
         influence_conversation: bool = True,
         is_builtin: bool = False,
         shared_for_coexistence: bool = False,
@@ -380,32 +380,24 @@ class FloatSlot(Slot):
             filled_by=filled_by,
             validation=validation,
         )
+        self.validate_min_max_range(min_value, max_value)
         self.max_value = max_value
         self.min_value = min_value
-        if min_value >= max_value:
-            raise InvalidSlotConfigError(
-                "Float slot ('{}') created with an invalid range "
-                "using min ({}) and max ({}) values. Make sure "
-                "min is smaller than max."
-                "".format(self.name, self.min_value, self.max_value)
-            )
-        if initial_value is not None and not (min_value <= initial_value <= max_value):
-            rasa.shared.utils.io.raise_warning(
-                f"Float slot ('{self.name}') created with an initial value "
-                f"{self.value}. This value is outside of the configured min "
-                f"({self.min_value}) and max ({self.max_value}) values."
-            )
     def _as_feature(self) -> List[float]:
+        # set default min and max values used in prior releases
+        # to prevent regressions for existing models
+        min_value = self.min_value or 0.0
+        max_value = self.max_value or 1.0
         try:
-            capped_value = max(self.min_value, min(self.max_value, float(self.value)))
-            if abs(self.max_value - self.min_value) > 0:
-                covered_range = abs(self.max_value - self.min_value)
+            capped_value = max(min_value, min(max_value, float(self.value)))
+            if abs(max_value - min_value) > 0:
+                covered_range = abs(max_value - min_value)
             else:
                 covered_range = 1
-            return [1.0, (capped_value - self.min_value) / covered_range]
+            return [1.0, (capped_value - min_value) / covered_range]
         except (TypeError, ValueError):
             return [0.0, 0.0]
@@ -424,13 +416,52 @@ class FloatSlot(Slot):
             return value
     def is_valid_value(self, value: Any) -> bool:
-        """Checks if the slot contains the value."""
-        # check that coerced type is float
-        return value is None or isinstance(self.coerce_value(value), float)
+        """Checks if the slot value is valid."""
+        if value is None:
+            return True
+        if not isinstance(self.coerce_value(value), float):
+            return False
+        if (
+            self.min_value is not None
+            and self.max_value is not None
+            and not (self.min_value <= value <= self.max_value)
+        ):
+            return False
+        return True
     def _feature_dimensionality(self) -> int:
         return len(self.as_feature())
+    def validate_min_max_range(
+        self, min_value: Optional[float], max_value: Optional[float]
+    ) -> None:
+        """Validates the min-max range for the slot.
+        Raises:
+            InvalidSlotConfigError, if the min-max range is invalid.
+        """
+        if min_value is not None and max_value is not None and min_value >= max_value:
+            raise InvalidSlotConfigError(
+                f"Float slot ('{self.name}') created with an invalid range "
+                f"using min ({min_value}) and max ({max_value}) values. Make sure "
+                f"min is smaller than max."
+            )
+        if (
+            self.initial_value is not None
+            and min_value is not None
+            and max_value is not None
+            and not (min_value <= self.initial_value <= max_value)
+        ):
+            raise InvalidSlotConfigError(
+                f"Float slot ('{self.name}') created with an initial value "
+                f"{self.initial_value}. This value is outside of the configured min "
+                f"({min_value}) and max ({max_value}) values."
+            )
 class BooleanSlot(Slot):
     """A slot storing a truth value."""

rasa/shared/core/training_data/story_reader/story_reader.py CHANGED Viewed

@@ -126,4 +126,4 @@ class StoryParseError(RasaCoreException, ValueError):
     def __init__(self, message: Text) -> None:
         self.message = message
-        super(StoryParseError, self).__init__()
+        super(StoryParseError, self).__init__(message)

rasa/shared/exceptions.py CHANGED Viewed

@@ -16,6 +16,17 @@ class RasaException(Exception):
     to the users, but will be ignored in telemetry.
     """
+    def __init__(self, message: str, suppress_stack_trace: bool = False, **kwargs: Any):
+        """Initialize the exception.
+        Args:
+            message: The error message.
+            suppress_stack_trace: If True, the stack trace will be suppressed in logs.
+            **kwargs: Additional keyword arguments (e.g., cause for exception chaining).
+        """
+        Exception.__init__(self, message)
+        self.suppress_stack_trace = suppress_stack_trace
 class RasaCoreException(RasaException):
     """Basic exception for errors raised by Rasa Core."""
@@ -113,6 +124,17 @@ class SchemaValidationError(RasaException, jsonschema.ValidationError):
 class InvalidEntityFormatException(RasaException, json.JSONDecodeError):
     """Raised if the format of an entity is invalid."""
+    def __init__(self, msg: str, doc: str = "", pos: int = 0):
+        """Initialize the exception.
+        Args:
+            msg: The error message.
+            doc: The document that caused the error.
+            pos: The position in the document where the error occurred.
+        """
+        RasaException.__init__(self, msg)
+        json.JSONDecodeError.__init__(self, msg, doc, pos)
     @classmethod
     def create_from(
         cls, other: json.JSONDecodeError, msg: Text
@@ -130,8 +152,7 @@ class ConnectionException(RasaException):
 class ProviderClientAPIException(RasaException):
-    """Raised for errors that occur during API interactions
-    with LLM / embedding providers.
+    """For errors during API interactions with LLM / embedding providers.
     Attributes:
         original_exception (Exception): The original exception that was

rasa/shared/providers/_configs/azure_openai_client_config.py CHANGED Viewed

@@ -167,8 +167,9 @@ class OAuthConfigWrapper(OAuth, BaseModel):
 @dataclass
 class AzureOpenAIClientConfig:
-    """Parses configuration for Azure OpenAI client, resolves aliases and
-    raises deprecation warnings.
+    """Parses configuration for Azure OpenAI client.
+    Resolves aliases and raises deprecation warnings.
     Raises:
         ValueError: Raised in cases of invalid configuration:
@@ -301,9 +302,7 @@ class AzureOpenAIClientConfig:
 def is_azure_openai_config(config: dict) -> bool:
-    """Check whether the configuration is meant to configure
-    an Azure OpenAI client.
-    """
+    """Check whether the configuration is meant to configure an Azure OpenAI client."""
     # Resolve any aliases that are specific to Azure OpenAI configuration
     config = AzureOpenAIClientConfig.resolve_config_aliases(config)

rasa/shared/providers/_configs/default_litellm_client_config.py CHANGED Viewed

@@ -40,8 +40,9 @@ FORBIDDEN_KEYS = [
 @dataclass
 class DefaultLiteLLMClientConfig:
-    """Parses configuration for default LiteLLM client, resolves aliases and
-    raises deprecation warnings.
+    """Parses configuration for default LiteLLM client.
+    Resolves aliases and raises deprecation warnings.
     Raises:
         ValueError: Raised in cases of invalid configuration:
@@ -72,8 +73,7 @@ class DefaultLiteLLMClientConfig:
     @classmethod
     def from_dict(cls, config: dict) -> DefaultLiteLLMClientConfig:
-        """
-        Initializes a dataclass from the passed config.
+        """Initializes a dataclass from the passed config.
         Args:
             config: (dict) The config from which to initialize.

rasa/shared/providers/_configs/litellm_router_client_config.py CHANGED Viewed

@@ -38,8 +38,9 @@ _LITELLM_UNSUPPORTED_KEYS = [
 @dataclass
 class LiteLLMRouterClientConfig:
-    """Parses configuration for a LiteLLM Router client. The configuration is expected
-    to be in the following format:
+    """Parses configuration for a LiteLLM Router client.
+    The configuration is expected to be in the following format:
     {
         "id": "model_group_id",

rasa/shared/providers/_configs/openai_client_config.py CHANGED Viewed

@@ -64,8 +64,9 @@ FORBIDDEN_KEYS = [
 @dataclass
 class OpenAIClientConfig:
-    """Parses configuration for Azure OpenAI client, resolves aliases and
-    raises deprecation warnings.
+    """Parses configuration for OpenAI client.
+    Resolves aliases and raises deprecation warnings.
     Raises:
         ValueError: Raised in cases of invalid configuration:
@@ -118,8 +119,7 @@ class OpenAIClientConfig:
     @classmethod
     def from_dict(cls, config: dict) -> OpenAIClientConfig:
-        """
-        Initializes a dataclass from the passed config.
+        """Initializes a dataclass from the passed config.
         Args:
             config: (dict) The config from which to initialize.
@@ -168,9 +168,7 @@ class OpenAIClientConfig:
 def is_openai_config(config: dict) -> bool:
-    """Check whether the configuration is meant to configure
-    an OpenAI client.
-    """
+    """Check whether the configuration is meant to configure an OpenAI client."""
     # Process the config to handle all the aliases
     config = OpenAIClientConfig.resolve_config_aliases(config)

rasa/shared/providers/_configs/rasa_llm_client_config.py CHANGED Viewed

@@ -22,8 +22,9 @@ structlogger = structlog.get_logger()
 @dataclass
 class RasaLLMClientConfig:
-    """Parses configuration for a Rasa Hosted LiteLLM client,
-    checks required keys present.
+    """Parses configuration for a Rasa Hosted LiteLLM client.
+    Checks required keys present.
     Raises:
         ValueError: Raised in cases of invalid configuration:
@@ -40,8 +41,7 @@ class RasaLLMClientConfig:
     @classmethod
     def from_dict(cls, config: dict) -> RasaLLMClientConfig:
-        """
-        Initializes a dataclass from the passed config.
+        """Initializes a dataclass from the passed config.
         Args:
             config: (dict) The config from which to initialize.

rasa/shared/providers/_configs/self_hosted_llm_client_config.py CHANGED Viewed

@@ -61,8 +61,9 @@ FORBIDDEN_KEYS = [
 @dataclass
 class SelfHostedLLMClientConfig:
-    """Parses configuration for Self Hosted LiteLLM client, resolves aliases and
-    raises deprecation warnings.
+    """Parses configuration for Self Hosted LiteLLM client.
+    Resolves aliases and raises deprecation warnings.
     Raises:
         ValueError: Raised in cases of invalid configuration:
@@ -116,8 +117,7 @@ class SelfHostedLLMClientConfig:
     @classmethod
     def from_dict(cls, config: dict) -> SelfHostedLLMClientConfig:
-        """
-        Initializes a dataclass from the passed config.
+        """Initializes a dataclass from the passed config.
         Args:
             config: (dict) The config from which to initialize.

rasa/shared/providers/llm/_base_litellm_client.py CHANGED Viewed

@@ -1,12 +1,14 @@
 from __future__ import annotations
+import asyncio
 import logging
 from abc import abstractmethod
-from typing import Any, Dict, List, Union, cast
+from typing import Any, Dict, List, NoReturn, Union, cast
 import structlog
 from litellm import acompletion, completion, validate_environment
+from rasa.core.constants import DEFAULT_REQUEST_TIMEOUT
 from rasa.shared.constants import (
     _VALIDATE_ENVIRONMENT_MISSING_KEYS_KEY,
     API_BASE_CONFIG_KEY,
@@ -57,26 +59,24 @@ class _BaseLiteLLMClient:
     @property
     @abstractmethod
     def config(self) -> dict:
-        """Returns the configuration for that the llm client
-        in dictionary form.
-        """
+        """Returns the configuration for that the llm client in dictionary form."""
         pass
     @property
     @abstractmethod
     def _litellm_model_name(self) -> str:
-        """Returns the value of LiteLLM's model parameter to be used in
-        completion/acompletion in LiteLLM format:
+        """Returns the value of LiteLLM's model parameter.
+        To be used in completion/acompletion in LiteLLM format:
         <provider>/<model or deployment name>
         """
         pass
     @property
     def _litellm_extra_parameters(self) -> Dict[str, Any]:
-        """Returns a dictionary of extra parameters which include model
-        parameters as well as LiteLLM specific input parameters.
+        """Returns a dictionary of extra parameters.
+        Includes model parameters as well as LiteLLM specific input parameters.
         By default, this returns an empty dictionary (no extra parameters).
         """
         return {}
@@ -96,8 +96,9 @@ class _BaseLiteLLMClient:
         }
     def validate_client_setup(self) -> None:
-        """Perform client validation. By default only environment variables
-        are validated.
+        """Perform client validation.
+        By default only environment variables are validated.
         Raises:
             ProviderClientValidationError if validation fails.
@@ -188,10 +189,17 @@ class _BaseLiteLLMClient:
             arguments = cast(
                 Dict[str, Any], resolve_environment_variables(self._completion_fn_args)
             )
-            response = await acompletion(
-                messages=formatted_messages, **{**arguments, **kwargs}
+            timeout = self._litellm_extra_parameters.get(
+                "timeout", DEFAULT_REQUEST_TIMEOUT
+            )
+            response = await asyncio.wait_for(
+                acompletion(messages=formatted_messages, **{**arguments, **kwargs}),
+                timeout=timeout,
             )
             return self._format_response(response)
+        except asyncio.TimeoutError:
+            self._handle_timeout_error()
         except Exception as e:
             message = ""
             from rasa.shared.providers.llm.self_hosted_llm_client import (
@@ -211,6 +219,25 @@ class _BaseLiteLLMClient:
                 )
             raise ProviderClientAPIException(e, message) from e
+    def _handle_timeout_error(self) -> NoReturn:
+        """Handle asyncio.TimeoutError and raise ProviderClientAPIException.
+        Raises:
+            ProviderClientAPIException: Always raised with formatted timeout error.
+        """
+        timeout = self._litellm_extra_parameters.get("timeout", DEFAULT_REQUEST_TIMEOUT)
+        error_message = (
+            f"APITimeoutError - Request timed out. Error_str: "
+            f"Request timed out. - timeout value={timeout:.6f}, "
+            f"time taken={timeout:.6f} seconds"
+        )
+        # nosemgrep: semgrep.rules.pii-positional-arguments-in-logging
+        # Error message contains only numeric timeout values, not PII
+        structlogger.error(
+            f"{self.__class__.__name__.lower()}.llm.timeout", error=error_message
+        )
+        raise ProviderClientAPIException(asyncio.TimeoutError(error_message)) from None
     def _get_formatted_messages(
         self, messages: Union[List[dict], List[str], str]
     ) -> List[Dict[str, str]]:
@@ -312,8 +339,9 @@ class _BaseLiteLLMClient:
     @staticmethod
     def _ensure_certificates() -> None:
-        """Configures SSL certificates for LiteLLM. This method is invoked during
-        client initialization.
+        """Configures SSL certificates for LiteLLM.
+        This method is invoked during client initialization.
         LiteLLM may utilize `openai` clients or other providers that require
         SSL verification settings through the `SSL_VERIFY` / `SSL_CERTIFICATE`

rasa/shared/providers/llm/litellm_router_llm_client.py CHANGED Viewed

@@ -1,10 +1,12 @@
 from __future__ import annotations
+import asyncio
 import logging
 from typing import Any, Dict, List, Union
 import structlog
+from rasa.core.constants import DEFAULT_REQUEST_TIMEOUT
 from rasa.shared.exceptions import ProviderClientAPIException
 from rasa.shared.providers._configs.litellm_router_client_config import (
     LiteLLMRouterClientConfig,
@@ -79,13 +81,14 @@ class LiteLLMRouterLLMClient(_BaseLiteLLMRouterClient, _BaseLiteLLMClient):
     @suppress_logs(log_level=logging.WARNING)
     def _text_completion(self, prompt: Union[List[str], str]) -> LLMResponse:
-        """
-        Synchronously generate completions for given prompt.
+        """Synchronously generate completions for given prompt.
         Args:
             prompt: Prompt to generate the completion for.
         Returns:
             List of message completions.
         Raises:
             ProviderClientAPIException: If the API request fails.
         """
@@ -103,21 +106,30 @@ class LiteLLMRouterLLMClient(_BaseLiteLLMRouterClient, _BaseLiteLLMClient):
     @suppress_logs(log_level=logging.WARNING)
     async def _atext_completion(self, prompt: Union[List[str], str]) -> LLMResponse:
-        """
-        Asynchronously generate completions for given prompt.
+        """Asynchronously generate completions for given prompt.
         Args:
             prompt: Prompt to generate the completion for.
         Returns:
             List of message completions.
         Raises:
             ProviderClientAPIException: If the API request fails.
         """
         try:
-            response = await self.router_client.atext_completion(
-                prompt=prompt, **self._completion_fn_args
+            timeout = self._litellm_extra_parameters.get(
+                "timeout", DEFAULT_REQUEST_TIMEOUT
+            )
+            response = await asyncio.wait_for(
+                self.router_client.atext_completion(
+                    prompt=prompt, **self._completion_fn_args
+                ),
+                timeout=timeout,
             )
             return self._format_text_completion_response(response)
+        except asyncio.TimeoutError:
+            self._handle_timeout_error()
         except Exception as e:
             raise ProviderClientAPIException(e)
@@ -125,8 +137,7 @@ class LiteLLMRouterLLMClient(_BaseLiteLLMRouterClient, _BaseLiteLLMClient):
     def completion(
         self, messages: Union[List[dict], List[str], str], **kwargs: Any
     ) -> LLMResponse:
-        """
-        Synchronously generate completions for given list of messages.
+        """Synchronously generate completions for given list of messages.
         Method overrides the base class method to call the appropriate
         completion method based on the configuration. If the chat completions
@@ -143,15 +154,17 @@ class LiteLLMRouterLLMClient(_BaseLiteLLMRouterClient, _BaseLiteLLMClient):
                     as a user message.
                 - a single message as a string which will be formatted as user message.
             **kwargs: Additional parameters to pass to the completion call.
         Returns:
             List of message completions.
         Raises:
             ProviderClientAPIException: If the API request fails.
         """
         if not self._use_chat_completions_endpoint:
             return self._text_completion(messages)
         try:
-            formatted_messages = self._format_messages(messages)
+            formatted_messages = self._get_formatted_messages(messages)
             response = self.router_client.completion(
                 messages=formatted_messages, **{**self._completion_fn_args, **kwargs}
             )
@@ -163,8 +176,7 @@ class LiteLLMRouterLLMClient(_BaseLiteLLMRouterClient, _BaseLiteLLMClient):
     async def acompletion(
         self, messages: Union[List[dict], List[str], str], **kwargs: Any
     ) -> LLMResponse:
-        """
-        Asynchronously generate completions for given list of messages.
+        """Asynchronously generate completions for given list of messages.
         Method overrides the base class method to call the appropriate
         completion method based on the configuration. If the chat completions
@@ -181,28 +193,39 @@ class LiteLLMRouterLLMClient(_BaseLiteLLMRouterClient, _BaseLiteLLMClient):
                     as a user message.
                 - a single message as a string which will be formatted as user message.
             **kwargs: Additional parameters to pass to the completion call.
         Returns:
             List of message completions.
         Raises:
             ProviderClientAPIException: If the API request fails.
         """
         if not self._use_chat_completions_endpoint:
             return await self._atext_completion(messages)
         try:
-            formatted_messages = self._format_messages(messages)
-            response = await self.router_client.acompletion(
-                messages=formatted_messages, **{**self._completion_fn_args, **kwargs}
+            formatted_messages = self._get_formatted_messages(messages)
+            timeout = self._litellm_extra_parameters.get(
+                "timeout", DEFAULT_REQUEST_TIMEOUT
+            )
+            response = await asyncio.wait_for(
+                self.router_client.acompletion(
+                    messages=formatted_messages,
+                    **{**self._completion_fn_args, **kwargs},
+                ),
+                timeout=timeout,
             )
             return self._format_response(response)
+        except asyncio.TimeoutError:
+            self._handle_timeout_error()
         except Exception as e:
             raise ProviderClientAPIException(e)
     @property
     def _completion_fn_args(self) -> Dict[str, Any]:
-        """Returns the completion arguments for invoking a call through
-        LiteLLM's completion functions.
-        """
+        """Returns the completion arguments.
+        For invoking a call through LiteLLM's completion functions.
+        """
         return {
             **self._litellm_extra_parameters,
             LITE_LLM_MODEL_FIELD: self.model_group_id,

rasa-pro 3.14.0rc4__py3-none-any.whl → 3.14.2__py3-none-any.whl

Potentially problematic release.

rasa-pro 3.14.0rc4__py3-none-any.whl → 3.14.2__py3-none-any.whl