rasa-pro 3.10.16__py3-none-any.whl → 3.11.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release: this version of rasa-pro might be problematic.
Files changed (240)
  1. rasa/__main__.py +31 -15
  2. rasa/api.py +12 -2
  3. rasa/cli/arguments/default_arguments.py +24 -4
  4. rasa/cli/arguments/run.py +15 -0
  5. rasa/cli/arguments/shell.py +5 -1
  6. rasa/cli/arguments/train.py +17 -9
  7. rasa/cli/evaluate.py +7 -7
  8. rasa/cli/inspect.py +19 -7
  9. rasa/cli/interactive.py +1 -0
  10. rasa/cli/llm_fine_tuning.py +11 -14
  11. rasa/cli/project_templates/calm/config.yml +5 -7
  12. rasa/cli/project_templates/calm/endpoints.yml +15 -2
  13. rasa/cli/project_templates/tutorial/config.yml +8 -5
  14. rasa/cli/project_templates/tutorial/data/flows.yml +1 -1
  15. rasa/cli/project_templates/tutorial/data/patterns.yml +5 -0
  16. rasa/cli/project_templates/tutorial/domain.yml +14 -0
  17. rasa/cli/project_templates/tutorial/endpoints.yml +5 -0
  18. rasa/cli/run.py +7 -0
  19. rasa/cli/scaffold.py +4 -2
  20. rasa/cli/studio/upload.py +0 -15
  21. rasa/cli/train.py +14 -53
  22. rasa/cli/utils.py +14 -11
  23. rasa/cli/x.py +7 -7
  24. rasa/constants.py +3 -1
  25. rasa/core/actions/action.py +77 -33
  26. rasa/core/actions/action_hangup.py +29 -0
  27. rasa/core/actions/action_repeat_bot_messages.py +89 -0
  28. rasa/core/actions/e2e_stub_custom_action_executor.py +5 -1
  29. rasa/core/actions/http_custom_action_executor.py +4 -0
  30. rasa/core/agent.py +2 -2
  31. rasa/core/brokers/kafka.py +3 -1
  32. rasa/core/brokers/pika.py +3 -1
  33. rasa/core/channels/__init__.py +10 -6
  34. rasa/core/channels/channel.py +41 -4
  35. rasa/core/channels/development_inspector.py +150 -46
  36. rasa/core/channels/inspector/README.md +1 -1
  37. rasa/core/channels/inspector/dist/assets/{arc-b6e548fe.js → arc-bc141fb2.js} +1 -1
  38. rasa/core/channels/inspector/dist/assets/{c4Diagram-d0fbc5ce-fa03ac9e.js → c4Diagram-d0fbc5ce-be2db283.js} +1 -1
  39. rasa/core/channels/inspector/dist/assets/{classDiagram-936ed81e-ee67392a.js → classDiagram-936ed81e-55366915.js} +1 -1
  40. rasa/core/channels/inspector/dist/assets/{classDiagram-v2-c3cb15f1-9b283fae.js → classDiagram-v2-c3cb15f1-bb529518.js} +1 -1
  41. rasa/core/channels/inspector/dist/assets/{createText-62fc7601-8b6fcc2a.js → createText-62fc7601-b0ec81d6.js} +1 -1
  42. rasa/core/channels/inspector/dist/assets/{edges-f2ad444c-22e77f4f.js → edges-f2ad444c-6166330c.js} +1 -1
  43. rasa/core/channels/inspector/dist/assets/{erDiagram-9d236eb7-60ffc87f.js → erDiagram-9d236eb7-5ccc6a8e.js} +1 -1
  44. rasa/core/channels/inspector/dist/assets/{flowDb-1972c806-9dd802e4.js → flowDb-1972c806-fca3bfe4.js} +1 -1
  45. rasa/core/channels/inspector/dist/assets/{flowDiagram-7ea5b25a-5fa1912f.js → flowDiagram-7ea5b25a-4739080f.js} +1 -1
  46. rasa/core/channels/inspector/dist/assets/flowDiagram-v2-855bc5b3-736177bf.js +1 -0
  47. rasa/core/channels/inspector/dist/assets/{flowchart-elk-definition-abe16c3d-622a1fd2.js → flowchart-elk-definition-abe16c3d-7c1b0e0f.js} +1 -1
  48. rasa/core/channels/inspector/dist/assets/{ganttDiagram-9b5ea136-e285a63a.js → ganttDiagram-9b5ea136-772fd050.js} +1 -1
  49. rasa/core/channels/inspector/dist/assets/{gitGraphDiagram-99d0ae7c-f237bdca.js → gitGraphDiagram-99d0ae7c-8eae1dc9.js} +1 -1
  50. rasa/core/channels/inspector/dist/assets/{index-2c4b9a3b-4b03d70e.js → index-2c4b9a3b-f55afcdf.js} +1 -1
  51. rasa/core/channels/inspector/dist/assets/index-e7cef9de.js +1317 -0
  52. rasa/core/channels/inspector/dist/assets/{infoDiagram-736b4530-72a0fa5f.js → infoDiagram-736b4530-124d4a14.js} +1 -1
  53. rasa/core/channels/inspector/dist/assets/{journeyDiagram-df861f2b-82218c41.js → journeyDiagram-df861f2b-7c4fae44.js} +1 -1
  54. rasa/core/channels/inspector/dist/assets/{layout-78cff630.js → layout-b9885fb6.js} +1 -1
  55. rasa/core/channels/inspector/dist/assets/{line-5038b469.js → line-7c59abb6.js} +1 -1
  56. rasa/core/channels/inspector/dist/assets/{linear-c4fc4098.js → linear-4776f780.js} +1 -1
  57. rasa/core/channels/inspector/dist/assets/{mindmap-definition-beec6740-c33c8ea6.js → mindmap-definition-beec6740-2332c46c.js} +1 -1
  58. rasa/core/channels/inspector/dist/assets/{pieDiagram-dbbf0591-a8d03059.js → pieDiagram-dbbf0591-8fb39303.js} +1 -1
  59. rasa/core/channels/inspector/dist/assets/{quadrantDiagram-4d7f4fd6-6a0e56b2.js → quadrantDiagram-4d7f4fd6-3c7180a2.js} +1 -1
  60. rasa/core/channels/inspector/dist/assets/{requirementDiagram-6fc4c22a-2dc7c7bd.js → requirementDiagram-6fc4c22a-e910bcb8.js} +1 -1
  61. rasa/core/channels/inspector/dist/assets/{sankeyDiagram-8f13d901-2360fe39.js → sankeyDiagram-8f13d901-ead16c89.js} +1 -1
  62. rasa/core/channels/inspector/dist/assets/{sequenceDiagram-b655622a-41b9f9ad.js → sequenceDiagram-b655622a-29a02a19.js} +1 -1
  63. rasa/core/channels/inspector/dist/assets/{stateDiagram-59f0c015-0aad326f.js → stateDiagram-59f0c015-042b3137.js} +1 -1
  64. rasa/core/channels/inspector/dist/assets/{stateDiagram-v2-2b26beab-9847d984.js → stateDiagram-v2-2b26beab-2178c0f3.js} +1 -1
  65. rasa/core/channels/inspector/dist/assets/{styles-080da4f6-564d890e.js → styles-080da4f6-23ffa4fc.js} +1 -1
  66. rasa/core/channels/inspector/dist/assets/{styles-3dcbcfbf-38957613.js → styles-3dcbcfbf-94f59763.js} +1 -1
  67. rasa/core/channels/inspector/dist/assets/{styles-9c745c82-f0fc6921.js → styles-9c745c82-78a6bebc.js} +1 -1
  68. rasa/core/channels/inspector/dist/assets/{svgDrawCommon-4835440b-ef3c5a77.js → svgDrawCommon-4835440b-eae2a6f6.js} +1 -1
  69. rasa/core/channels/inspector/dist/assets/{timeline-definition-5b62e21b-bf3e91c1.js → timeline-definition-5b62e21b-5c968d92.js} +1 -1
  70. rasa/core/channels/inspector/dist/assets/{xychartDiagram-2b33534f-4d4026c0.js → xychartDiagram-2b33534f-fd3db0d5.js} +1 -1
  71. rasa/core/channels/inspector/dist/index.html +18 -17
  72. rasa/core/channels/inspector/index.html +17 -16
  73. rasa/core/channels/inspector/package.json +5 -1
  74. rasa/core/channels/inspector/src/App.tsx +118 -68
  75. rasa/core/channels/inspector/src/components/Chat.tsx +95 -0
  76. rasa/core/channels/inspector/src/components/DiagramFlow.tsx +11 -10
  77. rasa/core/channels/inspector/src/components/DialogueStack.tsx +10 -25
  78. rasa/core/channels/inspector/src/components/LoadingSpinner.tsx +6 -3
  79. rasa/core/channels/inspector/src/helpers/audiostream.ts +165 -0
  80. rasa/core/channels/inspector/src/helpers/formatters.test.ts +10 -0
  81. rasa/core/channels/inspector/src/helpers/formatters.ts +107 -41
  82. rasa/core/channels/inspector/src/helpers/utils.ts +92 -7
  83. rasa/core/channels/inspector/src/types.ts +21 -1
  84. rasa/core/channels/inspector/yarn.lock +94 -1
  85. rasa/core/channels/rest.py +51 -46
  86. rasa/core/channels/socketio.py +28 -1
  87. rasa/core/channels/telegram.py +1 -1
  88. rasa/core/channels/twilio.py +1 -1
  89. rasa/core/channels/{audiocodes.py → voice_ready/audiocodes.py} +122 -69
  90. rasa/core/channels/{voice_aware → voice_ready}/jambonz.py +26 -8
  91. rasa/core/channels/{voice_aware → voice_ready}/jambonz_protocol.py +57 -5
  92. rasa/core/channels/{twilio_voice.py → voice_ready/twilio_voice.py} +64 -28
  93. rasa/core/channels/voice_ready/utils.py +37 -0
  94. rasa/core/channels/voice_stream/asr/__init__.py +0 -0
  95. rasa/core/channels/voice_stream/asr/asr_engine.py +89 -0
  96. rasa/core/channels/voice_stream/asr/asr_event.py +18 -0
  97. rasa/core/channels/voice_stream/asr/azure.py +129 -0
  98. rasa/core/channels/voice_stream/asr/deepgram.py +90 -0
  99. rasa/core/channels/voice_stream/audio_bytes.py +8 -0
  100. rasa/core/channels/voice_stream/browser_audio.py +107 -0
  101. rasa/core/channels/voice_stream/call_state.py +23 -0
  102. rasa/core/channels/voice_stream/tts/__init__.py +0 -0
  103. rasa/core/channels/voice_stream/tts/azure.py +106 -0
  104. rasa/core/channels/voice_stream/tts/cartesia.py +118 -0
  105. rasa/core/channels/voice_stream/tts/tts_cache.py +27 -0
  106. rasa/core/channels/voice_stream/tts/tts_engine.py +58 -0
  107. rasa/core/channels/voice_stream/twilio_media_streams.py +173 -0
  108. rasa/core/channels/voice_stream/util.py +57 -0
  109. rasa/core/channels/voice_stream/voice_channel.py +427 -0
  110. rasa/core/information_retrieval/qdrant.py +1 -0
  111. rasa/core/nlg/contextual_response_rephraser.py +45 -17
  112. rasa/{nlu → core}/persistor.py +203 -68
  113. rasa/core/policies/enterprise_search_policy.py +119 -63
  114. rasa/core/policies/flows/flow_executor.py +15 -22
  115. rasa/core/policies/intentless_policy.py +83 -28
  116. rasa/core/processor.py +25 -0
  117. rasa/core/run.py +12 -2
  118. rasa/core/secrets_manager/constants.py +4 -0
  119. rasa/core/secrets_manager/factory.py +8 -0
  120. rasa/core/secrets_manager/vault.py +11 -1
  121. rasa/core/training/interactive.py +33 -34
  122. rasa/core/utils.py +47 -21
  123. rasa/dialogue_understanding/coexistence/llm_based_router.py +41 -14
  124. rasa/dialogue_understanding/commands/__init__.py +6 -0
  125. rasa/dialogue_understanding/commands/repeat_bot_messages_command.py +60 -0
  126. rasa/dialogue_understanding/commands/session_end_command.py +61 -0
  127. rasa/dialogue_understanding/commands/user_silence_command.py +59 -0
  128. rasa/dialogue_understanding/commands/utils.py +5 -0
  129. rasa/dialogue_understanding/generator/constants.py +2 -0
  130. rasa/dialogue_understanding/generator/flow_retrieval.py +47 -9
  131. rasa/dialogue_understanding/generator/llm_based_command_generator.py +38 -15
  132. rasa/dialogue_understanding/generator/llm_command_generator.py +1 -1
  133. rasa/dialogue_understanding/generator/multi_step/multi_step_llm_command_generator.py +35 -13
  134. rasa/dialogue_understanding/generator/single_step/command_prompt_template.jinja2 +3 -0
  135. rasa/dialogue_understanding/generator/single_step/single_step_llm_command_generator.py +60 -13
  136. rasa/dialogue_understanding/patterns/default_flows_for_patterns.yml +53 -0
  137. rasa/dialogue_understanding/patterns/repeat.py +37 -0
  138. rasa/dialogue_understanding/patterns/user_silence.py +37 -0
  139. rasa/dialogue_understanding/processor/command_processor.py +21 -1
  140. rasa/e2e_test/aggregate_test_stats_calculator.py +1 -11
  141. rasa/e2e_test/assertions.py +136 -61
  142. rasa/e2e_test/assertions_schema.yml +23 -0
  143. rasa/e2e_test/e2e_test_case.py +85 -6
  144. rasa/e2e_test/e2e_test_runner.py +2 -3
  145. rasa/e2e_test/utils/e2e_yaml_utils.py +1 -1
  146. rasa/engine/graph.py +3 -10
  147. rasa/engine/loader.py +12 -0
  148. rasa/engine/recipes/config_files/default_config.yml +0 -3
  149. rasa/engine/recipes/default_recipe.py +0 -1
  150. rasa/engine/recipes/graph_recipe.py +0 -1
  151. rasa/engine/runner/dask.py +2 -2
  152. rasa/engine/storage/local_model_storage.py +12 -42
  153. rasa/engine/storage/storage.py +1 -5
  154. rasa/engine/validation.py +527 -74
  155. rasa/model_manager/__init__.py +0 -0
  156. rasa/model_manager/config.py +40 -0
  157. rasa/model_manager/model_api.py +559 -0
  158. rasa/model_manager/runner_service.py +286 -0
  159. rasa/model_manager/socket_bridge.py +146 -0
  160. rasa/model_manager/studio_jwt_auth.py +86 -0
  161. rasa/model_manager/trainer_service.py +325 -0
  162. rasa/model_manager/utils.py +87 -0
  163. rasa/model_manager/warm_rasa_process.py +187 -0
  164. rasa/model_service.py +112 -0
  165. rasa/model_training.py +42 -23
  166. rasa/nlu/tokenizers/whitespace_tokenizer.py +3 -14
  167. rasa/server.py +4 -2
  168. rasa/shared/constants.py +60 -8
  169. rasa/shared/core/constants.py +13 -0
  170. rasa/shared/core/domain.py +107 -50
  171. rasa/shared/core/events.py +29 -0
  172. rasa/shared/core/flows/flow.py +5 -0
  173. rasa/shared/core/flows/flows_list.py +19 -6
  174. rasa/shared/core/flows/flows_yaml_schema.json +10 -0
  175. rasa/shared/core/flows/utils.py +39 -0
  176. rasa/shared/core/flows/validation.py +121 -0
  177. rasa/shared/core/flows/yaml_flows_io.py +15 -27
  178. rasa/shared/core/slots.py +5 -0
  179. rasa/shared/importers/importer.py +59 -41
  180. rasa/shared/importers/multi_project.py +23 -11
  181. rasa/shared/importers/rasa.py +12 -3
  182. rasa/shared/importers/remote_importer.py +196 -0
  183. rasa/shared/importers/utils.py +3 -1
  184. rasa/shared/nlu/training_data/formats/rasa_yaml.py +18 -3
  185. rasa/shared/nlu/training_data/training_data.py +18 -19
  186. rasa/shared/providers/_configs/litellm_router_client_config.py +220 -0
  187. rasa/shared/providers/_configs/model_group_config.py +167 -0
  188. rasa/shared/providers/_configs/openai_client_config.py +1 -1
  189. rasa/shared/providers/_configs/rasa_llm_client_config.py +73 -0
  190. rasa/shared/providers/_configs/self_hosted_llm_client_config.py +1 -0
  191. rasa/shared/providers/_configs/utils.py +16 -0
  192. rasa/shared/providers/_utils.py +79 -0
  193. rasa/shared/providers/embedding/_base_litellm_embedding_client.py +13 -29
  194. rasa/shared/providers/embedding/azure_openai_embedding_client.py +54 -21
  195. rasa/shared/providers/embedding/default_litellm_embedding_client.py +24 -0
  196. rasa/shared/providers/embedding/litellm_router_embedding_client.py +135 -0
  197. rasa/shared/providers/llm/_base_litellm_client.py +34 -22
  198. rasa/shared/providers/llm/azure_openai_llm_client.py +50 -29
  199. rasa/shared/providers/llm/default_litellm_llm_client.py +24 -0
  200. rasa/shared/providers/llm/litellm_router_llm_client.py +182 -0
  201. rasa/shared/providers/llm/rasa_llm_client.py +112 -0
  202. rasa/shared/providers/llm/self_hosted_llm_client.py +5 -29
  203. rasa/shared/providers/mappings.py +19 -0
  204. rasa/shared/providers/router/__init__.py +0 -0
  205. rasa/shared/providers/router/_base_litellm_router_client.py +183 -0
  206. rasa/shared/providers/router/router_client.py +73 -0
  207. rasa/shared/utils/common.py +40 -24
  208. rasa/shared/utils/health_check/__init__.py +0 -0
  209. rasa/shared/utils/health_check/embeddings_health_check_mixin.py +31 -0
  210. rasa/shared/utils/health_check/health_check.py +258 -0
  211. rasa/shared/utils/health_check/llm_health_check_mixin.py +31 -0
  212. rasa/shared/utils/io.py +27 -6
  213. rasa/shared/utils/llm.py +354 -44
  214. rasa/shared/utils/schemas/events.py +2 -0
  215. rasa/shared/utils/schemas/model_config.yml +0 -10
  216. rasa/shared/utils/yaml.py +181 -38
  217. rasa/studio/data_handler.py +3 -1
  218. rasa/studio/upload.py +160 -74
  219. rasa/telemetry.py +94 -17
  220. rasa/tracing/config.py +3 -1
  221. rasa/tracing/instrumentation/attribute_extractors.py +95 -18
  222. rasa/tracing/instrumentation/instrumentation.py +121 -0
  223. rasa/utils/common.py +5 -0
  224. rasa/utils/endpoints.py +27 -1
  225. rasa/utils/io.py +8 -16
  226. rasa/utils/log_utils.py +9 -2
  227. rasa/utils/sanic_error_handler.py +32 -0
  228. rasa/validator.py +110 -16
  229. rasa/version.py +1 -1
  230. {rasa_pro-3.10.16.dist-info → rasa_pro-3.11.0.dist-info}/METADATA +16 -14
  231. {rasa_pro-3.10.16.dist-info → rasa_pro-3.11.0.dist-info}/RECORD +236 -185
  232. rasa/core/channels/inspector/dist/assets/flowDiagram-v2-855bc5b3-1844e5a5.js +0 -1
  233. rasa/core/channels/inspector/dist/assets/index-a5d3e69d.js +0 -1040
  234. rasa/core/channels/voice_aware/utils.py +0 -20
  235. rasa/llm_fine_tuning/notebooks/unsloth_finetuning.ipynb +0 -407
  236. /rasa/core/channels/{voice_aware → voice_ready}/__init__.py +0 -0
  237. /rasa/core/channels/{voice_native → voice_stream}/__init__.py +0 -0
  238. {rasa_pro-3.10.16.dist-info → rasa_pro-3.11.0.dist-info}/NOTICE +0 -0
  239. {rasa_pro-3.10.16.dist-info → rasa_pro-3.11.0.dist-info}/WHEEL +0 -0
  240. {rasa_pro-3.10.16.dist-info → rasa_pro-3.11.0.dist-info}/entry_points.txt +0 -0

rasa/shared/providers/embedding/litellm_router_embedding_client.py
@@ -0,0 +1,135 @@
+from typing import Any, Dict, List
+import logging
+import structlog
+
+from rasa.shared.exceptions import ProviderClientAPIException
+from rasa.shared.providers._configs.litellm_router_client_config import (
+    LiteLLMRouterClientConfig,
+)
+from rasa.shared.providers.embedding._base_litellm_embedding_client import (
+    _BaseLiteLLMEmbeddingClient,
+)
+from rasa.shared.providers.embedding.embedding_response import EmbeddingResponse
+from rasa.shared.providers.router._base_litellm_router_client import (
+    _BaseLiteLLMRouterClient,
+)
+from rasa.shared.utils.io import suppress_logs
+
+structlogger = structlog.get_logger()
+
+
+class LiteLLMRouterEmbeddingClient(
+    _BaseLiteLLMRouterClient, _BaseLiteLLMEmbeddingClient
+):
+    """A client for interfacing with LiteLLM Router Embedding endpoints.
+
+    Parameters:
+        model_group_id (str): The model group ID.
+        model_configurations (List[Dict[str, Any]]): The list of model configurations.
+        router_settings (Dict[str, Any]): The router settings.
+        kwargs (Optional[Dict[str, Any]]): Additional configuration parameters.
+
+    Raises:
+        ProviderClientValidationError: If validation of the client setup fails.
+    """
+
+    def __init__(
+        self,
+        model_group_id: str,
+        model_configurations: List[Dict[str, Any]],
+        router_settings: Dict[str, Any],
+        **kwargs: Any,
+    ):
+        super().__init__(
+            model_group_id, model_configurations, router_settings, **kwargs
+        )
+
+    @classmethod
+    def from_config(cls, config: Dict[str, Any]) -> "LiteLLMRouterEmbeddingClient":
+        """Instantiates a LiteLLM Router Embedding client from a configuration dict.
+
+        Args:
+            config: (Dict[str, Any]) The configuration dictionary.
+
+        Returns:
+            LiteLLMRouterLLMClient: The instantiated LiteLLM Router LLM client.
+
+        Raises:
+            ValueError: If the configuration is invalid.
+        """
+        try:
+            client_config = LiteLLMRouterClientConfig.from_dict(config)
+        except (KeyError, ValueError) as e:
+            message = "Cannot instantiate a client from the passed configuration."
+            structlogger.error(
+                "litellm_router_llm_client.from_config.error",
+                message=message,
+                config=config,
+                original_error=e,
+            )
+            raise
+
+        return cls(
+            model_group_id=client_config.model_group_id,
+            model_configurations=client_config.litellm_model_list,
+            router_settings=client_config.litellm_router_settings,
+            **client_config.extra_parameters,
+        )
+
+    @suppress_logs(log_level=logging.WARNING)
+    def embed(self, documents: List[str]) -> EmbeddingResponse:
+        """
+        Embeds a list of documents synchronously.
+
+        Args:
+            documents: List of documents to be embedded.
+
+        Returns:
+            List of embedding vectors.
+
+        Raises:
+            ProviderClientAPIException: If API calls raised an error.
+        """
+        self.validate_documents(documents)
+        try:
+            response = self.router_client.embedding(
+                input=documents, **self._embedding_fn_args
+            )
+            return self._format_response(response)
+        except Exception as e:
+            raise ProviderClientAPIException(
+                message="Failed to embed documents", original_exception=e
+            )
+
+    @suppress_logs(log_level=logging.WARNING)
+    async def aembed(self, documents: List[str]) -> EmbeddingResponse:
+        """
+        Embeds a list of documents asynchronously.
+
+        Args:
+            documents: List of documents to be embedded.
+
+        Returns:
+            List of embedding vectors.
+
+        Raises:
+            ProviderClientAPIException: If API calls raised an error.
+        """
+        self.validate_documents(documents)
+        try:
+            response = await self.router_client.aembedding(
+                input=documents, **self._embedding_fn_args
+            )
+            return self._format_response(response)
+        except Exception as e:
+            raise ProviderClientAPIException(
+                message="Failed to embed documents", original_exception=e
+            )
+
+    @property
+    def _embedding_fn_args(self) -> Dict[str, Any]:
+        """Returns the arguments to be passed to the embedding function."""
+        return {
+            **self._litellm_extra_parameters,
+            "model": self._model_group_id,
+        }
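
For orientation, here is a minimal usage sketch of the new embedding router client; it is not part of the diff. The shape of each model configuration entry is an assumption based on LiteLLM's router model_list convention (model_name plus litellm_params), and the router settings shown are illustrative.

from rasa.shared.providers.embedding.litellm_router_embedding_client import (
    LiteLLMRouterEmbeddingClient,
)

# Hypothetical model configuration in LiteLLM router "model_list" style;
# the exact schema accepted by the Rasa router base client may differ.
model_configurations = [
    {
        "model_name": "embeddings",
        "litellm_params": {"model": "openai/text-embedding-3-small"},
    },
]

client = LiteLLMRouterEmbeddingClient(
    model_group_id="embeddings",
    model_configurations=model_configurations,
    router_settings={"routing_strategy": "simple-shuffle"},
)

# embed() validates the documents, calls the router's embedding endpoint,
# and returns an EmbeddingResponse (see the hunk above).
response = client.embed(["How do I reset my password?"])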

rasa/shared/providers/llm/_base_litellm_client.py
@@ -1,6 +1,6 @@
+import logging
 from abc import abstractmethod
 from typing import Dict, List, Any, Union
-import logging
 
 import structlog
 from litellm import (
@@ -9,7 +9,7 @@ from litellm import (
     validate_environment,
 )
 
-from rasa.shared.constants import API_BASE_CONFIG_KEY
+from rasa.shared.constants import API_BASE_CONFIG_KEY, API_KEY
 from rasa.shared.exceptions import (
     ProviderClientAPIException,
     ProviderClientValidationError,
@@ -19,7 +19,7 @@ from rasa.shared.providers._ssl_verification_utils import (
     ensure_ssl_certificates_for_litellm_openai_based_clients,
 )
 from rasa.shared.providers.llm.llm_response import LLMResponse, LLMUsage
-from rasa.shared.utils.io import suppress_logs
+from rasa.shared.utils.io import suppress_logs, resolve_environment_variables
 
 structlogger = structlog.get_logger()
 
@@ -99,12 +99,12 @@ class _BaseLiteLLMClient:
             ProviderClientValidationError if validation fails.
         """
         self._validate_environment_variables()
-        self._validate_api_key_not_in_config()
 
     def _validate_environment_variables(self) -> None:
        """Validate that the required environment variables are set."""
        validation_info = validate_environment(
            self._litellm_model_name,
+            api_key=self._litellm_extra_parameters.get(API_KEY),
            api_base=self._litellm_extra_parameters.get(API_BASE_CONFIG_KEY),
        )
        if missing_environment_variables := validation_info.get(
@@ -121,18 +121,6 @@ class _BaseLiteLLMClient:
             )
             raise ProviderClientValidationError(event_info)
 
-    def _validate_api_key_not_in_config(self) -> None:
-        if "api_key" in self._litellm_extra_parameters:
-            event_info = (
-                "API Key is set through `api_key` extra parameter."
-                "Set API keys through environment variables."
-            )
-            structlogger.error(
-                "base_litellm_client.validate_api_key_not_in_config",
-                event_info=event_info,
-            )
-            raise ProviderClientValidationError(event_info)
-
 
     @suppress_logs(log_level=logging.WARNING)
     def completion(self, messages: Union[List[str], str]) -> LLMResponse:
@@ -149,9 +137,8 @@
         """
         try:
             formatted_messages = self._format_messages(messages)
-            response = completion(
-                messages=formatted_messages, **self._completion_fn_args
-            )
+            arguments = resolve_environment_variables(self._completion_fn_args)
+            response = completion(messages=formatted_messages, **arguments)
             return self._format_response(response)
         except Exception as e:
             raise ProviderClientAPIException(e)
@@ -172,9 +159,8 @@
         """
         try:
             formatted_messages = self._format_messages(messages)
-            response = await acompletion(
-                messages=formatted_messages, **self._completion_fn_args
-            )
+            arguments = resolve_environment_variables(self._completion_fn_args)
+            response = await acompletion(messages=formatted_messages, **arguments)
             return self._format_response(response)
         except Exception as e:
             message = ""
@@ -235,6 +221,32 @@
         )
         return formatted_response
 
+    def _format_text_completion_response(self, response: Any) -> LLMResponse:
+        """Parses the LiteLLM text completion response to Rasa format."""
+        formatted_response = LLMResponse(
+            id=response.id,
+            created=response.created,
+            choices=[choice.text for choice in response.choices],
+            model=response.model,
+        )
+        if (usage := response.usage) is not None:
+            prompt_tokens = (
+                num_tokens
+                if isinstance(num_tokens := usage.prompt_tokens, (int, float))
+                else 0
+            )
+            completion_tokens = (
+                num_tokens
+                if isinstance(num_tokens := usage.completion_tokens, (int, float))
+                else 0
+            )
+            formatted_response.usage = LLMUsage(prompt_tokens, completion_tokens)
+        structlogger.debug(
+            "base_litellm_client.formatted_response",
+            formatted_response=formatted_response.to_dict(),
+        )
+        return formatted_response
+
     @staticmethod
     def _ensure_certificates() -> None:
         """Configures SSL certificates for LiteLLM. This method is invoked during

rasa/shared/providers/llm/azure_openai_llm_client.py
@@ -17,6 +17,7 @@ from rasa.shared.constants import (
     OPENAI_API_KEY_ENV_VAR,
     AZURE_API_TYPE_ENV_VAR,
     AZURE_OPENAI_PROVIDER,
+    API_KEY,
 )
 from rasa.shared.exceptions import ProviderClientValidationError
 from rasa.shared.providers._configs.azure_openai_client_config import (
@@ -29,8 +30,7 @@ structlogger = structlog.get_logger()
 
 
 class AzureOpenAILLMClient(_BaseLiteLLMClient):
-    """
-    A client for interfacing with Azure's OpenAI LLM deployments.
+    """A client for interfacing with Azure's OpenAI LLM deployments.
 
     Parameters:
         deployment (str): The deployment name.
@@ -80,11 +80,7 @@ class AzureOpenAILLMClient(_BaseLiteLLMClient):
             or os.getenv(OPENAI_API_VERSION_ENV_VAR)
         )
 
-        # API key can be set through OPENAI_API_KEY too,
-        # because of the backward compatibility
-        self._api_key = os.getenv(AZURE_API_KEY_ENV_VAR) or os.getenv(
-            OPENAI_API_KEY_ENV_VAR
-        )
+        self._api_key_env_var = self._resolve_api_key_env_var()
 
         # Not used by LiteLLM, here for backward compatibility
         self._api_type = (
@@ -117,11 +113,6 @@ class AzureOpenAILLMClient(_BaseLiteLLMClient):
                 "env_var": AZURE_API_VERSION_ENV_VAR,
                 "deprecated_var": OPENAI_API_VERSION_ENV_VAR,
             },
-            "API Key": {
-                "current_value": self._api_key,
-                "env_var": AZURE_API_KEY_ENV_VAR,
-                "deprecated_var": OPENAI_API_KEY_ENV_VAR,
-            },
         }
 
         deprecation_warning_message = (
@@ -154,10 +145,51 @@ class AzureOpenAILLMClient(_BaseLiteLLMClient):
             )
             raise_deprecation_warning(message=message)
 
+    def _resolve_api_key_env_var(self) -> str:
+        """Resolves the environment variable to use for the API key.
+
+        Returns:
+            str: The env variable in dollar syntax format to use for the API key.
+        """
+        if API_KEY in self._extra_parameters:
+            # API key is set to an env var in the config itself
+            # in case the model is defined in the endpoints.yml
+            return self._extra_parameters[API_KEY]
+
+        if os.getenv(AZURE_API_KEY_ENV_VAR) is not None:
+            return "${AZURE_API_KEY}"
+
+        if os.getenv(OPENAI_API_KEY_ENV_VAR) is not None:
+            # API key can be set through OPENAI_API_KEY too,
+            # because of the backward compatibility
+            raise_deprecation_warning(
+                message=(
+                    f"Usage of '{OPENAI_API_KEY_ENV_VAR}' environment variable "
+                    "for setting the API key for Azure OpenAI "
+                    "client is deprecated and will be removed "
+                    f"in 4.0.0. Please use '{AZURE_API_KEY_ENV_VAR}' "
+                    "environment variable."
+                )
+            )
+            return "${OPENAI_API_KEY}"
+
+        structlogger.error(
+            "azure_openai_llm_client.api_key_not_set",
+            event_info=(
+                "API key not set, it is required for API calls. "
+                f"Set it either via the environment variable"
+                f"'{AZURE_API_KEY_ENV_VAR}' or directly"
+                f"via the config key '{API_KEY}'."
+            ),
+        )
+        raise ProviderClientValidationError(
+            f"Missing required environment variable/config key '{API_KEY}' for "
+            f"API calls."
+        )
+
     @classmethod
     def from_config(cls, config: Dict[str, Any]) -> "AzureOpenAILLMClient":
-        """
-        Initializes the client from given configuration.
+        """Initializes the client from given configuration.
 
         Args:
             config (Dict[str, Any]): Configuration.
@@ -212,23 +244,17 @@
 
     @property
     def model(self) -> Optional[str]:
-        """
-        Returns the name of the model deployed on Azure.
-        """
+        """Returns the name of the model deployed on Azure."""
         return self._model
 
     @property
     def api_base(self) -> Optional[str]:
-        """
-        Returns the API base URL for the Azure OpenAI llm client.
-        """
+        """Returns the API base URL for the Azure OpenAI llm client."""
         return self._api_base
 
     @property
     def api_version(self) -> Optional[str]:
-        """
-        Returns the API version for the Azure OpenAI llm client.
-        """
+        """Returns the API version for the Azure OpenAI llm client."""
         return self._api_version
 
     @property
@@ -261,7 +287,7 @@
             {
                 "api_base": self.api_base,
                 "api_version": self.api_version,
-                "api_key": self._api_key,
+                "api_key": self._api_key_env_var,
             }
         )
         return fn_args
@@ -305,11 +331,6 @@
                 "env_var": None,
                 "config_key": DEPLOYMENT_CONFIG_KEY,
             },
-            "API Key": {
-                "current_value": self._api_key,
-                "env_var": AZURE_API_KEY_ENV_VAR,
-                "config_key": None,
-            },
         }
 
         missing_settings = [
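
To make the api_key handling change concrete, here is a hedged configuration sketch, not taken from the diff. It assumes the usual Rasa Azure OpenAI config keys (provider, deployment, api_base, api_version) and shows the api_key supplied as a dollar-syntax environment variable reference, mirroring the values returned by _resolve_api_key_env_var above; the reference is only expanded to the real secret at request time via resolve_environment_variables in the base client.

from rasa.shared.providers.llm.azure_openai_llm_client import AzureOpenAILLMClient

# Sketch only: the api_key entry references an environment variable in dollar
# syntax instead of holding the raw secret; the surrounding key names are
# assumptions based on the standard Azure OpenAI client configuration.
config = {
    "provider": "azure",
    "deployment": "my-gpt-4o-deployment",
    "api_base": "https://my-resource.openai.azure.com",
    "api_version": "2024-02-15-preview",
    "api_key": "${AZURE_API_KEY}",
}

client = AzureOpenAILLMClient.from_config(config)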

rasa/shared/providers/llm/default_litellm_llm_client.py
@@ -1,8 +1,13 @@
 from typing import Dict, Any
 
+from rasa.shared.constants import (
+    AWS_BEDROCK_PROVIDER,
+    AWS_SAGEMAKER_PROVIDER,
+)
 from rasa.shared.providers._configs.default_litellm_client_config import (
     DefaultLiteLLMClientConfig,
 )
+from rasa.shared.providers._utils import validate_aws_setup_for_litellm_clients
 from rasa.shared.providers.llm._base_litellm_client import _BaseLiteLLMClient
 
 
@@ -82,3 +87,22 @@
         to the client provider and deployed model.
         """
         return self._extra_parameters
+
+    def validate_client_setup(self) -> None:
+        # TODO: Temporarily change the environment variable validation for AWS setup
+        # (Bedrock and SageMaker) until resolved by either:
+        # 1. An update from the LiteLLM package addressing the issue.
+        # 2. The implementation of a Bedrock client on our end.
+        # ---
+        # This fix ensures a consistent user experience for Bedrock (and
+        # SageMaker) in Rasa by allowing AWS secrets to be provided as extra
+        # parameters without triggering validation errors due to missing AWS
+        # environment variables.
+        if self.provider.lower() in [AWS_BEDROCK_PROVIDER, AWS_SAGEMAKER_PROVIDER]:
+            validate_aws_setup_for_litellm_clients(
+                self._litellm_model_name,
+                self._litellm_extra_parameters,
+                "default_litellm_llm_client",
+            )
+        else:
+            super().validate_client_setup()
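
The TODO comment above explains that AWS credentials can now be passed as extra parameters instead of environment variables for Bedrock and SageMaker. A hedged sketch of such a configuration follows; the AWS parameter names mirror LiteLLM's Bedrock options, and the from_config constructor is assumed to exist on this client as it does on its siblings.

from rasa.shared.providers.llm.default_litellm_llm_client import DefaultLiteLLMClient

# Sketch: AWS secrets supplied as extra parameters. With this change,
# validate_client_setup() routes Bedrock/SageMaker configurations through
# validate_aws_setup_for_litellm_clients instead of the generic
# environment-variable check in the base client.
config = {
    "provider": "bedrock",
    "model": "anthropic.claude-3-5-sonnet-20240620-v1:0",
    "aws_region_name": "us-east-1",
    "aws_access_key_id": "${AWS_ACCESS_KEY_ID}",
    "aws_secret_access_key": "${AWS_SECRET_ACCESS_KEY}",
}

client = DefaultLiteLLMClient.from_config(config)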

rasa/shared/providers/llm/litellm_router_llm_client.py
@@ -0,0 +1,182 @@
+from typing import Any, Dict, List, Union
+import logging
+import structlog
+
+from rasa.shared.exceptions import ProviderClientAPIException
+from rasa.shared.providers._configs.litellm_router_client_config import (
+    LiteLLMRouterClientConfig,
+)
+from rasa.shared.providers.llm._base_litellm_client import _BaseLiteLLMClient
+from rasa.shared.providers.llm.llm_response import LLMResponse
+from rasa.shared.providers.router._base_litellm_router_client import (
+    _BaseLiteLLMRouterClient,
+)
+from rasa.shared.utils.io import suppress_logs
+
+structlogger = structlog.get_logger()
+
+
+class LiteLLMRouterLLMClient(_BaseLiteLLMRouterClient, _BaseLiteLLMClient):
+    """A client for interfacing with LiteLLM Router LLM endpoints.
+
+    Parameters:
+        model_group_id (str): The model group ID.
+        model_configurations (List[Dict[str, Any]]): The list of model configurations.
+        router_settings (Dict[str, Any]): The router settings.
+        kwargs (Optional[Dict[str, Any]]): Additional configuration parameters.
+
+    Raises:
+        ProviderClientValidationError: If validation of the client setup fails.
+    """
+
+    def __init__(
+        self,
+        model_group_id: str,
+        model_configurations: List[Dict[str, Any]],
+        router_settings: Dict[str, Any],
+        **kwargs: Any,
+    ):
+        super().__init__(
+            model_group_id, model_configurations, router_settings, **kwargs
+        )
+
+    @classmethod
+    def from_config(cls, config: Dict[str, Any]) -> "LiteLLMRouterLLMClient":
+        """Instantiates a LiteLLM Router LLM client from a configuration dict.
+
+        Args:
+            config: (Dict[str, Any]) The configuration dictionary.
+
+        Returns:
+            LiteLLMRouterLLMClient: The instantiated LiteLLM Router LLM client.
+
+        Raises:
+            ValueError: If the configuration is invalid.
+        """
+        try:
+            client_config = LiteLLMRouterClientConfig.from_dict(config)
+        except (KeyError, ValueError) as e:
+            message = "Cannot instantiate a client from the passed configuration."
+            structlogger.error(
+                "litellm_router_llm_client.from_config.error",
+                message=message,
+                config=config,
+                original_error=e,
+            )
+            raise
+
+        return cls(
+            model_group_id=client_config.model_group_id,
+            model_configurations=client_config.litellm_model_list,
+            router_settings=client_config.litellm_router_settings,
+            use_chat_completions_endpoint=client_config.use_chat_completions_endpoint,
+            **client_config.extra_parameters,
+        )
+
+    @suppress_logs(log_level=logging.WARNING)
+    def _text_completion(self, prompt: Union[List[str], str]) -> LLMResponse:
+        """
+        Synchronously generate completions for given prompt.
+
+        Args:
+            prompt: Prompt to generate the completion for.
+        Returns:
+            List of message completions.
+        Raises:
+            ProviderClientAPIException: If the API request fails.
+        """
+        try:
+            response = self.router_client.text_completion(
+                prompt=prompt, **self._completion_fn_args
+            )
+            return self._format_text_completion_response(response)
+        except Exception as e:
+            raise ProviderClientAPIException(e)
+
+    @suppress_logs(log_level=logging.WARNING)
+    async def _atext_completion(self, prompt: Union[List[str], str]) -> LLMResponse:
+        """
+        Asynchronously generate completions for given prompt.
+
+        Args:
+            prompt: Prompt to generate the completion for.
+        Returns:
+            List of message completions.
+        Raises:
+            ProviderClientAPIException: If the API request fails.
+        """
+        try:
+            response = await self.router_client.atext_completion(
+                prompt=prompt, **self._completion_fn_args
+            )
+            return self._format_text_completion_response(response)
+        except Exception as e:
+            raise ProviderClientAPIException(e)
+
+    @suppress_logs(log_level=logging.WARNING)
+    def completion(self, messages: Union[List[str], str]) -> LLMResponse:
+        """
+        Synchronously generate completions for given list of messages.
+
+        Method overrides the base class method to call the appropriate
+        completion method based on the configuration. If the chat completions
+        endpoint is enabled, the completion method is called. Otherwise, the
+        text_completion method is called.
+
+        Args:
+            messages: List of messages or a single message to generate the
+                completion for.
+        Returns:
+            List of message completions.
+        Raises:
+            ProviderClientAPIException: If the API request fails.
+        """
+        if not self._use_chat_completions_endpoint:
+            return self._text_completion(messages)
+        try:
+            formatted_messages = self._format_messages(messages)
+            response = self.router_client.completion(
+                messages=formatted_messages, **self._completion_fn_args
+            )
+            return self._format_response(response)
+        except Exception as e:
+            raise ProviderClientAPIException(e)
+
+    @suppress_logs(log_level=logging.WARNING)
+    async def acompletion(self, messages: Union[List[str], str]) -> LLMResponse:
+        """
+        Asynchronously generate completions for given list of messages.
+
+        Method overrides the base class method to call the appropriate
+        completion method based on the configuration. If the chat completions
+        endpoint is enabled, the completion method is called. Otherwise, the
+        text_completion method is called.
+
+        Args:
+            messages: List of messages or a single message to generate the
+                completion for.
+        Returns:
+            List of message completions.
+        Raises:
+            ProviderClientAPIException: If the API request fails.
+        """
+        if not self._use_chat_completions_endpoint:
+            return await self._atext_completion(messages)
+        try:
+            formatted_messages = self._format_messages(messages)
+            response = await self.router_client.acompletion(
+                messages=formatted_messages, **self._completion_fn_args
+            )
+            return self._format_response(response)
+        except Exception as e:
+            raise ProviderClientAPIException(e)
+
+    @property
+    def _completion_fn_args(self) -> Dict[str, Any]:
+        """Returns the completion arguments for invoking a call through
+        LiteLLM's completion functions.
+        """
+        return {
+            **self._litellm_extra_parameters,
+            "model": self.model_group_id,
+        }
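
A minimal usage sketch of the router LLM client defined above, not part of the diff. The model entry shape follows LiteLLM's router model_list convention and the router settings are illustrative; handling of the use_chat_completions_endpoint keyword by the router base class is inferred from the from_config call in the hunk.

from rasa.shared.providers.llm.litellm_router_llm_client import LiteLLMRouterLLMClient

# Hypothetical model configuration; the exact schema accepted by the
# Rasa router base client may differ.
model_configurations = [
    {
        "model_name": "gpt-4o",
        "litellm_params": {"model": "openai/gpt-4o"},
    },
]

client = LiteLLMRouterLLMClient(
    model_group_id="gpt-4o",
    model_configurations=model_configurations,
    router_settings={"routing_strategy": "simple-shuffle"},
    # When this flag is False, completion()/acompletion() fall back to the
    # router's text completion endpoints via _text_completion/_atext_completion.
    use_chat_completions_endpoint=True,
)

response = client.completion(["Summarise the user's last message."])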