rasa-pro 3.10.15__py3-none-any.whl → 3.11.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of rasa-pro might be problematic. Click here for more details.
- rasa/__main__.py +31 -15
- rasa/api.py +12 -2
- rasa/cli/arguments/default_arguments.py +24 -4
- rasa/cli/arguments/run.py +15 -0
- rasa/cli/arguments/shell.py +5 -1
- rasa/cli/arguments/train.py +17 -9
- rasa/cli/evaluate.py +7 -7
- rasa/cli/inspect.py +19 -7
- rasa/cli/interactive.py +1 -0
- rasa/cli/project_templates/calm/config.yml +5 -7
- rasa/cli/project_templates/calm/endpoints.yml +15 -2
- rasa/cli/project_templates/tutorial/config.yml +8 -5
- rasa/cli/project_templates/tutorial/data/flows.yml +1 -1
- rasa/cli/project_templates/tutorial/data/patterns.yml +5 -0
- rasa/cli/project_templates/tutorial/domain.yml +14 -0
- rasa/cli/project_templates/tutorial/endpoints.yml +5 -0
- rasa/cli/run.py +7 -0
- rasa/cli/scaffold.py +4 -2
- rasa/cli/studio/upload.py +0 -15
- rasa/cli/train.py +14 -53
- rasa/cli/utils.py +14 -11
- rasa/cli/x.py +7 -7
- rasa/constants.py +3 -1
- rasa/core/actions/action.py +77 -33
- rasa/core/actions/action_hangup.py +29 -0
- rasa/core/actions/action_repeat_bot_messages.py +89 -0
- rasa/core/actions/e2e_stub_custom_action_executor.py +5 -1
- rasa/core/actions/http_custom_action_executor.py +4 -0
- rasa/core/agent.py +2 -2
- rasa/core/brokers/kafka.py +3 -1
- rasa/core/brokers/pika.py +3 -1
- rasa/core/channels/__init__.py +10 -6
- rasa/core/channels/channel.py +41 -4
- rasa/core/channels/development_inspector.py +150 -46
- rasa/core/channels/inspector/README.md +1 -1
- rasa/core/channels/inspector/dist/assets/{arc-b6e548fe.js → arc-bc141fb2.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{c4Diagram-d0fbc5ce-fa03ac9e.js → c4Diagram-d0fbc5ce-be2db283.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{classDiagram-936ed81e-ee67392a.js → classDiagram-936ed81e-55366915.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{classDiagram-v2-c3cb15f1-9b283fae.js → classDiagram-v2-c3cb15f1-bb529518.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{createText-62fc7601-8b6fcc2a.js → createText-62fc7601-b0ec81d6.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{edges-f2ad444c-22e77f4f.js → edges-f2ad444c-6166330c.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{erDiagram-9d236eb7-60ffc87f.js → erDiagram-9d236eb7-5ccc6a8e.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{flowDb-1972c806-9dd802e4.js → flowDb-1972c806-fca3bfe4.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{flowDiagram-7ea5b25a-5fa1912f.js → flowDiagram-7ea5b25a-4739080f.js} +1 -1
- rasa/core/channels/inspector/dist/assets/flowDiagram-v2-855bc5b3-736177bf.js +1 -0
- rasa/core/channels/inspector/dist/assets/{flowchart-elk-definition-abe16c3d-622a1fd2.js → flowchart-elk-definition-abe16c3d-7c1b0e0f.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{ganttDiagram-9b5ea136-e285a63a.js → ganttDiagram-9b5ea136-772fd050.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{gitGraphDiagram-99d0ae7c-f237bdca.js → gitGraphDiagram-99d0ae7c-8eae1dc9.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{index-2c4b9a3b-4b03d70e.js → index-2c4b9a3b-f55afcdf.js} +1 -1
- rasa/core/channels/inspector/dist/assets/index-e7cef9de.js +1317 -0
- rasa/core/channels/inspector/dist/assets/{infoDiagram-736b4530-72a0fa5f.js → infoDiagram-736b4530-124d4a14.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{journeyDiagram-df861f2b-82218c41.js → journeyDiagram-df861f2b-7c4fae44.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{layout-78cff630.js → layout-b9885fb6.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{line-5038b469.js → line-7c59abb6.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{linear-c4fc4098.js → linear-4776f780.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{mindmap-definition-beec6740-c33c8ea6.js → mindmap-definition-beec6740-2332c46c.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{pieDiagram-dbbf0591-a8d03059.js → pieDiagram-dbbf0591-8fb39303.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{quadrantDiagram-4d7f4fd6-6a0e56b2.js → quadrantDiagram-4d7f4fd6-3c7180a2.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{requirementDiagram-6fc4c22a-2dc7c7bd.js → requirementDiagram-6fc4c22a-e910bcb8.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{sankeyDiagram-8f13d901-2360fe39.js → sankeyDiagram-8f13d901-ead16c89.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{sequenceDiagram-b655622a-41b9f9ad.js → sequenceDiagram-b655622a-29a02a19.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{stateDiagram-59f0c015-0aad326f.js → stateDiagram-59f0c015-042b3137.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{stateDiagram-v2-2b26beab-9847d984.js → stateDiagram-v2-2b26beab-2178c0f3.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{styles-080da4f6-564d890e.js → styles-080da4f6-23ffa4fc.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{styles-3dcbcfbf-38957613.js → styles-3dcbcfbf-94f59763.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{styles-9c745c82-f0fc6921.js → styles-9c745c82-78a6bebc.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{svgDrawCommon-4835440b-ef3c5a77.js → svgDrawCommon-4835440b-eae2a6f6.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{timeline-definition-5b62e21b-bf3e91c1.js → timeline-definition-5b62e21b-5c968d92.js} +1 -1
- rasa/core/channels/inspector/dist/assets/{xychartDiagram-2b33534f-4d4026c0.js → xychartDiagram-2b33534f-fd3db0d5.js} +1 -1
- rasa/core/channels/inspector/dist/index.html +18 -15
- rasa/core/channels/inspector/index.html +17 -14
- rasa/core/channels/inspector/package.json +5 -1
- rasa/core/channels/inspector/src/App.tsx +118 -68
- rasa/core/channels/inspector/src/components/Chat.tsx +95 -0
- rasa/core/channels/inspector/src/components/DiagramFlow.tsx +11 -10
- rasa/core/channels/inspector/src/components/DialogueStack.tsx +10 -25
- rasa/core/channels/inspector/src/components/LoadingSpinner.tsx +6 -3
- rasa/core/channels/inspector/src/helpers/audiostream.ts +165 -0
- rasa/core/channels/inspector/src/helpers/formatters.test.ts +10 -0
- rasa/core/channels/inspector/src/helpers/formatters.ts +107 -41
- rasa/core/channels/inspector/src/helpers/utils.ts +92 -7
- rasa/core/channels/inspector/src/types.ts +21 -1
- rasa/core/channels/inspector/yarn.lock +94 -1
- rasa/core/channels/rest.py +51 -46
- rasa/core/channels/socketio.py +28 -1
- rasa/core/channels/telegram.py +1 -1
- rasa/core/channels/twilio.py +1 -1
- rasa/core/channels/{audiocodes.py → voice_ready/audiocodes.py} +122 -69
- rasa/core/channels/{voice_aware → voice_ready}/jambonz.py +26 -8
- rasa/core/channels/{voice_aware → voice_ready}/jambonz_protocol.py +57 -5
- rasa/core/channels/{twilio_voice.py → voice_ready/twilio_voice.py} +64 -28
- rasa/core/channels/voice_ready/utils.py +37 -0
- rasa/core/channels/voice_stream/asr/__init__.py +0 -0
- rasa/core/channels/voice_stream/asr/asr_engine.py +89 -0
- rasa/core/channels/voice_stream/asr/asr_event.py +18 -0
- rasa/core/channels/voice_stream/asr/azure.py +129 -0
- rasa/core/channels/voice_stream/asr/deepgram.py +90 -0
- rasa/core/channels/voice_stream/audio_bytes.py +8 -0
- rasa/core/channels/voice_stream/browser_audio.py +107 -0
- rasa/core/channels/voice_stream/call_state.py +23 -0
- rasa/core/channels/voice_stream/tts/__init__.py +0 -0
- rasa/core/channels/voice_stream/tts/azure.py +106 -0
- rasa/core/channels/voice_stream/tts/cartesia.py +118 -0
- rasa/core/channels/voice_stream/tts/tts_cache.py +27 -0
- rasa/core/channels/voice_stream/tts/tts_engine.py +58 -0
- rasa/core/channels/voice_stream/twilio_media_streams.py +173 -0
- rasa/core/channels/voice_stream/util.py +57 -0
- rasa/core/channels/voice_stream/voice_channel.py +427 -0
- rasa/core/information_retrieval/qdrant.py +1 -0
- rasa/core/nlg/contextual_response_rephraser.py +45 -17
- rasa/{nlu → core}/persistor.py +203 -68
- rasa/core/policies/enterprise_search_policy.py +119 -63
- rasa/core/policies/flows/flow_executor.py +15 -22
- rasa/core/policies/intentless_policy.py +83 -28
- rasa/core/processor.py +25 -0
- rasa/core/run.py +12 -2
- rasa/core/secrets_manager/constants.py +4 -0
- rasa/core/secrets_manager/factory.py +8 -0
- rasa/core/secrets_manager/vault.py +11 -1
- rasa/core/training/interactive.py +33 -34
- rasa/core/utils.py +47 -21
- rasa/dialogue_understanding/coexistence/llm_based_router.py +41 -14
- rasa/dialogue_understanding/commands/__init__.py +6 -0
- rasa/dialogue_understanding/commands/repeat_bot_messages_command.py +60 -0
- rasa/dialogue_understanding/commands/session_end_command.py +61 -0
- rasa/dialogue_understanding/commands/user_silence_command.py +59 -0
- rasa/dialogue_understanding/commands/utils.py +5 -0
- rasa/dialogue_understanding/generator/constants.py +2 -0
- rasa/dialogue_understanding/generator/flow_retrieval.py +47 -9
- rasa/dialogue_understanding/generator/llm_based_command_generator.py +38 -15
- rasa/dialogue_understanding/generator/llm_command_generator.py +1 -1
- rasa/dialogue_understanding/generator/multi_step/multi_step_llm_command_generator.py +35 -13
- rasa/dialogue_understanding/generator/single_step/command_prompt_template.jinja2 +3 -0
- rasa/dialogue_understanding/generator/single_step/single_step_llm_command_generator.py +60 -13
- rasa/dialogue_understanding/patterns/default_flows_for_patterns.yml +53 -0
- rasa/dialogue_understanding/patterns/repeat.py +37 -0
- rasa/dialogue_understanding/patterns/user_silence.py +37 -0
- rasa/dialogue_understanding/processor/command_processor.py +21 -1
- rasa/e2e_test/aggregate_test_stats_calculator.py +1 -11
- rasa/e2e_test/assertions.py +136 -61
- rasa/e2e_test/assertions_schema.yml +23 -0
- rasa/e2e_test/e2e_test_case.py +85 -6
- rasa/e2e_test/e2e_test_runner.py +2 -3
- rasa/engine/graph.py +0 -1
- rasa/engine/loader.py +12 -0
- rasa/engine/recipes/config_files/default_config.yml +0 -3
- rasa/engine/recipes/default_recipe.py +0 -1
- rasa/engine/recipes/graph_recipe.py +0 -1
- rasa/engine/runner/dask.py +2 -2
- rasa/engine/storage/local_model_storage.py +12 -42
- rasa/engine/storage/storage.py +1 -5
- rasa/engine/validation.py +527 -74
- rasa/model_manager/__init__.py +0 -0
- rasa/model_manager/config.py +40 -0
- rasa/model_manager/model_api.py +559 -0
- rasa/model_manager/runner_service.py +286 -0
- rasa/model_manager/socket_bridge.py +146 -0
- rasa/model_manager/studio_jwt_auth.py +86 -0
- rasa/model_manager/trainer_service.py +325 -0
- rasa/model_manager/utils.py +87 -0
- rasa/model_manager/warm_rasa_process.py +187 -0
- rasa/model_service.py +112 -0
- rasa/model_training.py +42 -23
- rasa/nlu/tokenizers/whitespace_tokenizer.py +3 -14
- rasa/server.py +4 -2
- rasa/shared/constants.py +60 -8
- rasa/shared/core/constants.py +13 -0
- rasa/shared/core/domain.py +107 -50
- rasa/shared/core/events.py +29 -0
- rasa/shared/core/flows/flow.py +5 -0
- rasa/shared/core/flows/flows_list.py +19 -6
- rasa/shared/core/flows/flows_yaml_schema.json +10 -0
- rasa/shared/core/flows/utils.py +39 -0
- rasa/shared/core/flows/validation.py +121 -0
- rasa/shared/core/flows/yaml_flows_io.py +15 -27
- rasa/shared/core/slots.py +5 -0
- rasa/shared/importers/importer.py +59 -41
- rasa/shared/importers/multi_project.py +23 -11
- rasa/shared/importers/rasa.py +12 -3
- rasa/shared/importers/remote_importer.py +196 -0
- rasa/shared/importers/utils.py +3 -1
- rasa/shared/nlu/training_data/formats/rasa_yaml.py +18 -3
- rasa/shared/nlu/training_data/training_data.py +18 -19
- rasa/shared/providers/_configs/litellm_router_client_config.py +220 -0
- rasa/shared/providers/_configs/model_group_config.py +167 -0
- rasa/shared/providers/_configs/openai_client_config.py +1 -1
- rasa/shared/providers/_configs/rasa_llm_client_config.py +73 -0
- rasa/shared/providers/_configs/self_hosted_llm_client_config.py +1 -0
- rasa/shared/providers/_configs/utils.py +16 -0
- rasa/shared/providers/_utils.py +79 -0
- rasa/shared/providers/embedding/_base_litellm_embedding_client.py +13 -29
- rasa/shared/providers/embedding/azure_openai_embedding_client.py +54 -21
- rasa/shared/providers/embedding/default_litellm_embedding_client.py +24 -0
- rasa/shared/providers/embedding/litellm_router_embedding_client.py +135 -0
- rasa/shared/providers/llm/_base_litellm_client.py +34 -22
- rasa/shared/providers/llm/azure_openai_llm_client.py +50 -29
- rasa/shared/providers/llm/default_litellm_llm_client.py +24 -0
- rasa/shared/providers/llm/litellm_router_llm_client.py +182 -0
- rasa/shared/providers/llm/rasa_llm_client.py +112 -0
- rasa/shared/providers/llm/self_hosted_llm_client.py +5 -29
- rasa/shared/providers/mappings.py +19 -0
- rasa/shared/providers/router/__init__.py +0 -0
- rasa/shared/providers/router/_base_litellm_router_client.py +183 -0
- rasa/shared/providers/router/router_client.py +73 -0
- rasa/shared/utils/common.py +40 -24
- rasa/shared/utils/health_check/__init__.py +0 -0
- rasa/shared/utils/health_check/embeddings_health_check_mixin.py +31 -0
- rasa/shared/utils/health_check/health_check.py +258 -0
- rasa/shared/utils/health_check/llm_health_check_mixin.py +31 -0
- rasa/shared/utils/io.py +27 -6
- rasa/shared/utils/llm.py +353 -43
- rasa/shared/utils/schemas/events.py +2 -0
- rasa/shared/utils/schemas/model_config.yml +0 -10
- rasa/shared/utils/yaml.py +181 -38
- rasa/studio/data_handler.py +3 -1
- rasa/studio/upload.py +160 -74
- rasa/telemetry.py +94 -17
- rasa/tracing/config.py +3 -1
- rasa/tracing/instrumentation/attribute_extractors.py +95 -18
- rasa/tracing/instrumentation/instrumentation.py +121 -0
- rasa/utils/common.py +5 -0
- rasa/utils/endpoints.py +27 -1
- rasa/utils/io.py +8 -16
- rasa/utils/log_utils.py +9 -2
- rasa/utils/sanic_error_handler.py +32 -0
- rasa/validator.py +110 -4
- rasa/version.py +1 -1
- {rasa_pro-3.10.15.dist-info → rasa_pro-3.11.0.dist-info}/METADATA +14 -12
- {rasa_pro-3.10.15.dist-info → rasa_pro-3.11.0.dist-info}/RECORD +234 -183
- rasa/core/channels/inspector/dist/assets/flowDiagram-v2-855bc5b3-1844e5a5.js +0 -1
- rasa/core/channels/inspector/dist/assets/index-a5d3e69d.js +0 -1040
- rasa/core/channels/voice_aware/utils.py +0 -20
- rasa/llm_fine_tuning/notebooks/unsloth_finetuning.ipynb +0 -407
- /rasa/core/channels/{voice_aware → voice_ready}/__init__.py +0 -0
- /rasa/core/channels/{voice_native → voice_stream}/__init__.py +0 -0
- {rasa_pro-3.10.15.dist-info → rasa_pro-3.11.0.dist-info}/NOTICE +0 -0
- {rasa_pro-3.10.15.dist-info → rasa_pro-3.11.0.dist-info}/WHEEL +0 -0
- {rasa_pro-3.10.15.dist-info → rasa_pro-3.11.0.dist-info}/entry_points.txt +0 -0
|
@@ -1,9 +1,11 @@
|
|
|
1
1
|
from sanic import Blueprint, response
|
|
2
|
-
from sanic.request import Request
|
|
2
|
+
from sanic.request import Request, RequestParameters
|
|
3
3
|
from sanic.response import HTTPResponse
|
|
4
4
|
from twilio.twiml.voice_response import VoiceResponse, Gather
|
|
5
5
|
from typing import Text, Callable, Awaitable, List, Any, Dict, Optional
|
|
6
|
+
from dataclasses import asdict
|
|
6
7
|
|
|
8
|
+
import structlog
|
|
7
9
|
import rasa.utils.io
|
|
8
10
|
import rasa.shared.utils.io
|
|
9
11
|
from rasa.shared.core.events import BotUttered
|
|
@@ -13,6 +15,19 @@ from rasa.core.channels.channel import (
|
|
|
13
15
|
CollectingOutputChannel,
|
|
14
16
|
UserMessage,
|
|
15
17
|
)
|
|
18
|
+
from rasa.core.channels.voice_ready.utils import CallParameters
|
|
19
|
+
|
|
20
|
+
logger = structlog.get_logger(__name__)
|
|
21
|
+
|
|
22
|
+
|
|
23
|
+
def map_call_params(form: RequestParameters) -> CallParameters:
|
|
24
|
+
"""Map the Audiocodes parameters to the CallParameters dataclass."""
|
|
25
|
+
return CallParameters(
|
|
26
|
+
call_id=form.get("CallSid"),
|
|
27
|
+
user_phone=form.get("Caller"),
|
|
28
|
+
bot_phone=form.get("Called"),
|
|
29
|
+
direction=form.get("Direction"),
|
|
30
|
+
)
|
|
16
31
|
|
|
17
32
|
|
|
18
33
|
class TwilioVoiceInput(InputChannel):
|
|
@@ -105,7 +120,6 @@ class TwilioVoiceInput(InputChannel):
|
|
|
105
120
|
credentials = credentials or {}
|
|
106
121
|
|
|
107
122
|
return cls(
|
|
108
|
-
credentials.get("initial_prompt", "hello"),
|
|
109
123
|
credentials.get(
|
|
110
124
|
"reprompt_fallback_phrase",
|
|
111
125
|
"I'm sorry I didn't get that could you rephrase.",
|
|
@@ -118,7 +132,6 @@ class TwilioVoiceInput(InputChannel):
|
|
|
118
132
|
|
|
119
133
|
def __init__(
|
|
120
134
|
self,
|
|
121
|
-
initial_prompt: Optional[Text],
|
|
122
135
|
reprompt_fallback_phrase: Optional[Text],
|
|
123
136
|
assistant_voice: Optional[Text],
|
|
124
137
|
speech_timeout: Text = "5",
|
|
@@ -128,14 +141,12 @@ class TwilioVoiceInput(InputChannel):
|
|
|
128
141
|
"""Creates a connection to Twilio voice.
|
|
129
142
|
|
|
130
143
|
Args:
|
|
131
|
-
initial_prompt: text to use to prompt a conversation when call is answered.
|
|
132
144
|
reprompt_fallback_phrase: phrase to use if no user response.
|
|
133
145
|
assistant_voice: name of the assistant voice to use.
|
|
134
146
|
speech_timeout: how long to pause when user finished speaking.
|
|
135
147
|
speech_model: type of transcription model to use from Twilio.
|
|
136
148
|
enhanced: toggle to use Twilio's premium speech transcription model.
|
|
137
149
|
"""
|
|
138
|
-
self.initial_prompt = initial_prompt
|
|
139
150
|
self.reprompt_fallback_phrase = reprompt_fallback_phrase
|
|
140
151
|
self.assistant_voice = assistant_voice
|
|
141
152
|
self.speech_timeout = speech_timeout
|
|
@@ -239,22 +250,43 @@ class TwilioVoiceInput(InputChannel):
|
|
|
239
250
|
text = request.form.get("SpeechResult")
|
|
240
251
|
input_channel = self.name()
|
|
241
252
|
call_status = request.form.get("CallStatus")
|
|
253
|
+
metadata = {}
|
|
242
254
|
|
|
243
255
|
collector = TwilioVoiceCollectingOutputChannel()
|
|
244
256
|
|
|
257
|
+
logger.debug(
|
|
258
|
+
"twilio_voice.webhook",
|
|
259
|
+
sender_id=sender_id,
|
|
260
|
+
text=text,
|
|
261
|
+
call_status=call_status,
|
|
262
|
+
)
|
|
245
263
|
# Provide an initial greeting to answer the user's call.
|
|
246
264
|
if (text is None) and (call_status == "ringing"):
|
|
247
|
-
text =
|
|
265
|
+
text = "/session_start"
|
|
266
|
+
metadata = asdict(map_call_params(request.form))
|
|
267
|
+
|
|
268
|
+
# when call is disconnected
|
|
269
|
+
if call_status == "completed":
|
|
270
|
+
text = "/session_end"
|
|
271
|
+
metadata = {"reason": "user disconnected"}
|
|
248
272
|
|
|
249
273
|
# determine the response.
|
|
250
274
|
if text is not None:
|
|
275
|
+
logger.info("twilio_voice.webhook.text_not_none", sender_id=sender_id)
|
|
251
276
|
await on_new_message(
|
|
252
|
-
UserMessage(
|
|
277
|
+
UserMessage(
|
|
278
|
+
text,
|
|
279
|
+
collector,
|
|
280
|
+
sender_id,
|
|
281
|
+
input_channel=input_channel,
|
|
282
|
+
metadata=metadata,
|
|
283
|
+
)
|
|
253
284
|
)
|
|
254
285
|
|
|
255
286
|
twilio_response = self._build_twilio_voice_response(collector.messages)
|
|
256
287
|
# If the user doesn't respond resend the last message.
|
|
257
288
|
else:
|
|
289
|
+
logger.info("twilio_voice.webhook.text_none", sender_id=sender_id)
|
|
258
290
|
# Get last user utterance from tracker.
|
|
259
291
|
tracker = await request.app.ctx.agent.tracker_store.retrieve(sender_id)
|
|
260
292
|
last_response = None
|
|
@@ -285,6 +317,7 @@ class TwilioVoiceInput(InputChannel):
|
|
|
285
317
|
self, messages: List[Dict[Text, Any]]
|
|
286
318
|
) -> VoiceResponse:
|
|
287
319
|
"""Builds the Twilio Voice Response object."""
|
|
320
|
+
logger.debug("twilio_voice.build_twilio_voice_response", messages=messages)
|
|
288
321
|
voice_response = VoiceResponse()
|
|
289
322
|
gather = Gather(
|
|
290
323
|
input="speech",
|
|
@@ -299,6 +332,11 @@ class TwilioVoiceInput(InputChannel):
|
|
|
299
332
|
# Add a listener to the last message to listen for user response.
|
|
300
333
|
for i, message in enumerate(messages):
|
|
301
334
|
msg_text = message["text"]
|
|
335
|
+
# Check if the message is a hangup message.
|
|
336
|
+
if message.get("custom", {}).get("hangup"):
|
|
337
|
+
voice_response.hangup()
|
|
338
|
+
break
|
|
339
|
+
|
|
302
340
|
if i + 1 == len(messages):
|
|
303
341
|
gather.say(msg_text, voice=self.assistant_voice)
|
|
304
342
|
voice_response.append(gather)
|
|
@@ -320,38 +358,23 @@ class TwilioVoiceCollectingOutputChannel(CollectingOutputChannel):
|
|
|
320
358
|
"""Name of the output channel."""
|
|
321
359
|
return "twilio_voice"
|
|
322
360
|
|
|
323
|
-
@staticmethod
|
|
324
|
-
def _emoji_warning(text: Text) -> None:
|
|
325
|
-
"""Raises a warning if text contains an emoji."""
|
|
326
|
-
emoji_regex = rasa.utils.io.get_emoji_regex()
|
|
327
|
-
if emoji_regex.findall(text):
|
|
328
|
-
rasa.shared.utils.io.raise_warning(
|
|
329
|
-
"Text contains an emoji in a voice response. "
|
|
330
|
-
"Review responses to provide a voice-friendly alternative."
|
|
331
|
-
)
|
|
332
|
-
|
|
333
361
|
async def send_text_message(
|
|
334
362
|
self, recipient_id: Text, text: Text, **kwargs: Any
|
|
335
363
|
) -> None:
|
|
336
364
|
"""Sends the text message after removing emojis."""
|
|
337
|
-
|
|
365
|
+
text = rasa.utils.io.remove_emojis(text)
|
|
338
366
|
for message_part in text.strip().split("\n\n"):
|
|
339
367
|
await self._persist_message(self._message(recipient_id, text=message_part))
|
|
340
368
|
|
|
341
369
|
async def send_text_with_buttons(
|
|
342
370
|
self,
|
|
343
|
-
recipient_id:
|
|
344
|
-
text:
|
|
345
|
-
buttons: List[Dict[
|
|
371
|
+
recipient_id: str,
|
|
372
|
+
text: str,
|
|
373
|
+
buttons: List[Dict[str, Any]],
|
|
346
374
|
**kwargs: Any,
|
|
347
375
|
) -> None:
|
|
348
|
-
"""
|
|
349
|
-
self.
|
|
350
|
-
await self._persist_message(self._message(recipient_id, text=text))
|
|
351
|
-
|
|
352
|
-
for b in buttons:
|
|
353
|
-
self._emoji_warning(b["title"])
|
|
354
|
-
await self._persist_message(self._message(recipient_id, text=b["title"]))
|
|
376
|
+
"""Uses the concise button output format for voice channels."""
|
|
377
|
+
await self.send_text_with_buttons_concise(recipient_id, text, buttons, **kwargs)
|
|
355
378
|
|
|
356
379
|
async def send_image_url(
|
|
357
380
|
self, recipient_id: Text, image: Text, **kwargs: Any
|
|
@@ -365,3 +388,16 @@ class TwilioVoiceCollectingOutputChannel(CollectingOutputChannel):
|
|
|
365
388
|
"with a visual elements such as images and emojis "
|
|
366
389
|
"that are used in your voice channel."
|
|
367
390
|
)
|
|
391
|
+
|
|
392
|
+
async def hangup(self, recipient_id: Text, **kwargs: Any) -> None:
|
|
393
|
+
"""
|
|
394
|
+
Indicate that the conversation should be ended.
|
|
395
|
+
|
|
396
|
+
Parent class is a collecting output channel, so we don't actually hang up
|
|
397
|
+
but we add a custom message to the list of messages to be sent.
|
|
398
|
+
This message will be picked up by _build_twilio_voice_response
|
|
399
|
+
which will hang up the call.
|
|
400
|
+
"""
|
|
401
|
+
await self._persist_message(
|
|
402
|
+
self._message(recipient_id, custom={"hangup": True})
|
|
403
|
+
)
|
|
@@ -0,0 +1,37 @@
|
|
|
1
|
+
import structlog
|
|
2
|
+
from dataclasses import dataclass
|
|
3
|
+
from typing import Optional
|
|
4
|
+
|
|
5
|
+
|
|
6
|
+
structlogger = structlog.get_logger()
|
|
7
|
+
|
|
8
|
+
|
|
9
|
+
def validate_voice_license_scope() -> None:
|
|
10
|
+
from rasa.utils.licensing import (
|
|
11
|
+
PRODUCT_AREA,
|
|
12
|
+
VOICE_SCOPE,
|
|
13
|
+
validate_license_from_env,
|
|
14
|
+
)
|
|
15
|
+
|
|
16
|
+
"""Validate that the correct license scope is present."""
|
|
17
|
+
structlogger.info(
|
|
18
|
+
f"Validating current Rasa Pro license scope which must include "
|
|
19
|
+
f"the '{VOICE_SCOPE}' scope to use the voice channel."
|
|
20
|
+
)
|
|
21
|
+
|
|
22
|
+
voice_product_scope = PRODUCT_AREA + " " + VOICE_SCOPE
|
|
23
|
+
validate_license_from_env(product_area=voice_product_scope)
|
|
24
|
+
|
|
25
|
+
|
|
26
|
+
@dataclass
|
|
27
|
+
class CallParameters:
|
|
28
|
+
"""Standardized call parameters for voice channels."""
|
|
29
|
+
|
|
30
|
+
call_id: str
|
|
31
|
+
user_phone: str
|
|
32
|
+
bot_phone: str
|
|
33
|
+
user_name: Optional[str] = None
|
|
34
|
+
user_host: Optional[str] = None
|
|
35
|
+
bot_host: Optional[str] = None
|
|
36
|
+
direction: Optional[str] = None
|
|
37
|
+
stream_id: Optional[str] = None
|
|
File without changes
|
|
@@ -0,0 +1,89 @@
|
|
|
1
|
+
from dataclasses import dataclass
|
|
2
|
+
from typing import (
|
|
3
|
+
Dict,
|
|
4
|
+
AsyncIterator,
|
|
5
|
+
Any,
|
|
6
|
+
Generic,
|
|
7
|
+
Optional,
|
|
8
|
+
Tuple,
|
|
9
|
+
Type,
|
|
10
|
+
TypeVar,
|
|
11
|
+
)
|
|
12
|
+
|
|
13
|
+
from websockets.legacy.client import WebSocketClientProtocol
|
|
14
|
+
|
|
15
|
+
from rasa.core.channels.voice_stream.asr.asr_event import ASREvent
|
|
16
|
+
from rasa.core.channels.voice_stream.audio_bytes import RasaAudioBytes
|
|
17
|
+
from rasa.core.channels.voice_stream.util import MergeableConfig
|
|
18
|
+
from rasa.shared.exceptions import ConnectionException
|
|
19
|
+
from rasa.shared.utils.common import validate_environment
|
|
20
|
+
|
|
21
|
+
T = TypeVar("T", bound="ASREngineConfig")
|
|
22
|
+
E = TypeVar("E", bound="ASREngine")
|
|
23
|
+
|
|
24
|
+
|
|
25
|
+
@dataclass
|
|
26
|
+
class ASREngineConfig(MergeableConfig):
|
|
27
|
+
pass
|
|
28
|
+
|
|
29
|
+
|
|
30
|
+
class ASREngine(Generic[T]):
|
|
31
|
+
required_env_vars: Tuple[str, ...] = ()
|
|
32
|
+
required_packages: Tuple[str, ...] = ()
|
|
33
|
+
|
|
34
|
+
def __init__(self, config: Optional[T] = None):
|
|
35
|
+
self.config = self.get_default_config().merge(config)
|
|
36
|
+
self.asr_socket: Optional[WebSocketClientProtocol] = None
|
|
37
|
+
validate_environment(
|
|
38
|
+
self.required_env_vars,
|
|
39
|
+
self.required_packages,
|
|
40
|
+
f"ASR Engine {self.__class__.__name__}",
|
|
41
|
+
)
|
|
42
|
+
|
|
43
|
+
async def connect(self) -> None:
|
|
44
|
+
self.asr_socket = await self.open_websocket_connection()
|
|
45
|
+
|
|
46
|
+
async def open_websocket_connection(self) -> WebSocketClientProtocol:
|
|
47
|
+
"""Connect to the ASR system."""
|
|
48
|
+
raise NotImplementedError
|
|
49
|
+
|
|
50
|
+
@classmethod
|
|
51
|
+
def from_config_dict(cls: Type[E], config: Dict) -> E:
|
|
52
|
+
raise NotImplementedError
|
|
53
|
+
|
|
54
|
+
async def close_connection(self) -> None:
|
|
55
|
+
if self.asr_socket:
|
|
56
|
+
await self.asr_socket.close()
|
|
57
|
+
|
|
58
|
+
async def signal_audio_done(self) -> None:
|
|
59
|
+
"""Signal to the ASR Api that you are done sending data."""
|
|
60
|
+
raise NotImplementedError
|
|
61
|
+
|
|
62
|
+
async def send_audio_chunks(self, chunk: RasaAudioBytes) -> None:
|
|
63
|
+
"""Send audio chunks to the ASR system via the websocket."""
|
|
64
|
+
if self.asr_socket is None:
|
|
65
|
+
raise ConnectionException("Websocket not connected.")
|
|
66
|
+
engine_bytes = self.rasa_audio_bytes_to_engine_bytes(chunk)
|
|
67
|
+
await self.asr_socket.send(engine_bytes)
|
|
68
|
+
|
|
69
|
+
def rasa_audio_bytes_to_engine_bytes(self, chunk: RasaAudioBytes) -> bytes:
|
|
70
|
+
"""Convert RasaAudioBytes to bytes usable by this engine."""
|
|
71
|
+
raise NotImplementedError
|
|
72
|
+
|
|
73
|
+
async def stream_asr_events(self) -> AsyncIterator[ASREvent]:
|
|
74
|
+
"""Stream the events returned by the ASR system as it is fed audio bytes."""
|
|
75
|
+
if self.asr_socket is None:
|
|
76
|
+
raise ConnectionException("Websocket not connected.")
|
|
77
|
+
async for message in self.asr_socket:
|
|
78
|
+
asr_event = self.engine_event_to_asr_event(message)
|
|
79
|
+
if asr_event:
|
|
80
|
+
yield asr_event
|
|
81
|
+
|
|
82
|
+
def engine_event_to_asr_event(self, e: Any) -> Optional[ASREvent]:
|
|
83
|
+
"""Translate an engine event to a common ASREvent."""
|
|
84
|
+
raise NotImplementedError
|
|
85
|
+
|
|
86
|
+
@staticmethod
|
|
87
|
+
def get_default_config() -> T:
|
|
88
|
+
"""Get the default config for this component."""
|
|
89
|
+
raise NotImplementedError
|
|
@@ -0,0 +1,18 @@
|
|
|
1
|
+
from dataclasses import dataclass
|
|
2
|
+
|
|
3
|
+
|
|
4
|
+
@dataclass
|
|
5
|
+
class ASREvent:
|
|
6
|
+
@classmethod
|
|
7
|
+
def name(cls) -> str:
|
|
8
|
+
return cls.__name__
|
|
9
|
+
|
|
10
|
+
|
|
11
|
+
@dataclass
|
|
12
|
+
class NewTranscript(ASREvent):
|
|
13
|
+
text: str
|
|
14
|
+
|
|
15
|
+
|
|
16
|
+
@dataclass
|
|
17
|
+
class UserIsSpeaking(ASREvent):
|
|
18
|
+
pass
|
|
@@ -0,0 +1,129 @@
|
|
|
1
|
+
import os
|
|
2
|
+
from dataclasses import dataclass
|
|
3
|
+
from typing import Any, Dict, Optional, AsyncIterator
|
|
4
|
+
import asyncio
|
|
5
|
+
|
|
6
|
+
from rasa.core.channels.voice_stream.asr.asr_engine import ASREngine, ASREngineConfig
|
|
7
|
+
from rasa.core.channels.voice_stream.asr.asr_event import (
|
|
8
|
+
ASREvent,
|
|
9
|
+
NewTranscript,
|
|
10
|
+
UserIsSpeaking,
|
|
11
|
+
)
|
|
12
|
+
from rasa.core.channels.voice_stream.audio_bytes import HERTZ, RasaAudioBytes
|
|
13
|
+
from rasa.shared.constants import AZURE_SPEECH_API_KEY_ENV_VAR
|
|
14
|
+
from rasa.shared.exceptions import ConnectionException
|
|
15
|
+
|
|
16
|
+
|
|
17
|
+
@dataclass
|
|
18
|
+
class AzureASRConfig(ASREngineConfig):
|
|
19
|
+
language: Optional[str] = None
|
|
20
|
+
speech_region: Optional[str] = None
|
|
21
|
+
|
|
22
|
+
|
|
23
|
+
class AzureASR(ASREngine[AzureASRConfig]):
|
|
24
|
+
required_env_vars = (AZURE_SPEECH_API_KEY_ENV_VAR,)
|
|
25
|
+
required_packages = ("azure.cognitiveservices.speech",)
|
|
26
|
+
|
|
27
|
+
def __init__(self, config: Optional[AzureASRConfig] = None):
|
|
28
|
+
super().__init__(config)
|
|
29
|
+
|
|
30
|
+
import azure.cognitiveservices.speech as speechsdk
|
|
31
|
+
|
|
32
|
+
self.speech_recognizer: Optional[speechsdk.SpeechRecognizer] = None
|
|
33
|
+
self.stream: Optional[speechsdk.audio.PushAudioInputStream] = None
|
|
34
|
+
self.is_recognizing = False
|
|
35
|
+
self.queue: asyncio.Queue[speechsdk.SpeechRecognitionEventArgs] = (
|
|
36
|
+
asyncio.Queue()
|
|
37
|
+
)
|
|
38
|
+
|
|
39
|
+
@staticmethod
|
|
40
|
+
def validate_environment() -> None:
|
|
41
|
+
"""Make sure all needed requirements for this component are met."""
|
|
42
|
+
|
|
43
|
+
def signal_user_is_speaking(self, event: Any) -> None:
|
|
44
|
+
"""Replace the azure event with a generic is speaking event."""
|
|
45
|
+
self.fill_queue(UserIsSpeaking())
|
|
46
|
+
|
|
47
|
+
def fill_queue(self, event: Any) -> None:
|
|
48
|
+
"""Either puts the event or a dedicated ASR Event into the queue."""
|
|
49
|
+
self.queue.put_nowait(event)
|
|
50
|
+
|
|
51
|
+
async def connect(self) -> None:
|
|
52
|
+
import azure.cognitiveservices.speech as speechsdk
|
|
53
|
+
|
|
54
|
+
speech_config = speechsdk.SpeechConfig(
|
|
55
|
+
subscription=os.environ[AZURE_SPEECH_API_KEY_ENV_VAR],
|
|
56
|
+
region=self.config.speech_region,
|
|
57
|
+
)
|
|
58
|
+
audio_format = speechsdk.audio.AudioStreamFormat(
|
|
59
|
+
samples_per_second=HERTZ,
|
|
60
|
+
bits_per_sample=8,
|
|
61
|
+
channels=1,
|
|
62
|
+
wave_stream_format=speechsdk.AudioStreamWaveFormat.MULAW,
|
|
63
|
+
)
|
|
64
|
+
self.stream = speechsdk.audio.PushAudioInputStream(stream_format=audio_format)
|
|
65
|
+
audio_config = speechsdk.audio.AudioConfig(stream=self.stream)
|
|
66
|
+
self.speech_recognizer = speechsdk.SpeechRecognizer(
|
|
67
|
+
speech_config=speech_config,
|
|
68
|
+
language=self.config.language,
|
|
69
|
+
audio_config=audio_config,
|
|
70
|
+
)
|
|
71
|
+
self.speech_recognizer.recognized.connect(self.fill_queue)
|
|
72
|
+
self.speech_recognizer.recognizing.connect(self.signal_user_is_speaking)
|
|
73
|
+
self.speech_recognizer.start_continuous_recognition_async()
|
|
74
|
+
self.is_recognizing = True
|
|
75
|
+
|
|
76
|
+
async def close_connection(self) -> None:
    """Stop the continuous recognition session.

    Raises:
        ConnectionException: If `connect` was never called.
    """
    if self.speech_recognizer is None:
        # The Azure engine talks to the SDK through a push stream, not a
        # websocket — use the same wording as send_audio_chunks.
        raise ConnectionException("ASR not connected.")
    # The SDK call returns a future; we do not block on it, mirroring how
    # connect() starts recognition.
    self.speech_recognizer.stop_continuous_recognition_async()
|
|
80
|
+
|
|
81
|
+
async def signal_audio_done(self) -> None:
    """Mark the audio input as finished.

    Clearing the flag lets stream_asr_events drain any remaining queued
    events and then terminate its loop.
    """
    self.is_recognizing = False
|
|
84
|
+
|
|
85
|
+
def rasa_audio_bytes_to_engine_bytes(self, chunk: RasaAudioBytes) -> bytes:
    """Return the chunk unchanged.

    connect() configures Azure for mulaw/8 kHz/8 bit/mono input, which is
    exactly the RasaAudioBytes format, so no conversion is needed.
    """
    return chunk
|
|
88
|
+
|
|
89
|
+
async def send_audio_chunks(self, chunk: RasaAudioBytes) -> None:
    """Forward an audio chunk to Azure through the push input stream."""
    connected = self.speech_recognizer is not None and self.stream is not None
    if not connected:
        raise ConnectionException("ASR not connected.")
    self.stream.write(self.rasa_audio_bytes_to_engine_bytes(chunk))
|
|
95
|
+
|
|
96
|
+
async def stream_asr_events(self) -> AsyncIterator[ASREvent]:
    """Yield ASR events as the engine produces them from the audio input.

    Keeps polling the internal queue until `signal_audio_done` has been
    called and the queue is fully drained.

    Raises:
        ConnectionException: If the recognizer was never connected.
    """
    if self.speech_recognizer is None:
        # The Azure engine uses an SDK push stream, not a websocket — keep
        # the message consistent with send_audio_chunks.
        raise ConnectionException("ASR not connected.")
    while self.is_recognizing or not self.queue.empty():
        try:
            # Wake up periodically so the loop re-checks is_recognizing
            # even when no events arrive.
            message = await asyncio.wait_for(self.queue.get(), timeout=2)
        except asyncio.TimeoutError:
            continue
        asr_event = self.engine_event_to_asr_event(message)
        if asr_event:
            yield asr_event
|
|
108
|
+
|
|
109
|
+
def engine_event_to_asr_event(self, e: Any) -> Optional[ASREvent]:
    """Translate an Azure SDK event into a common ASREvent, if possible."""
    import azure.cognitiveservices.speech as speechsdk

    is_recognition_result = isinstance(
        e, speechsdk.SpeechRecognitionEventArgs
    ) and isinstance(e.result, speechsdk.SpeechRecognitionResult)
    if is_recognition_result:
        return NewTranscript(e.result.text)
    # Events that were already mapped earlier (e.g. UserIsSpeaking from
    # signal_user_is_speaking) pass through untouched.
    if isinstance(e, ASREvent):
        return e
    return None
|
|
122
|
+
|
|
123
|
+
@staticmethod
def get_default_config() -> AzureASRConfig:
    """Return the default configuration (US English, Germany West Central)."""
    default_language = "en-US"
    default_region = "germanywestcentral"
    return AzureASRConfig(default_language, default_region)
|
|
126
|
+
|
|
127
|
+
@classmethod
def from_config_dict(cls, config: Dict) -> "AzureASR":
    """Build an engine instance from a raw configuration dictionary."""
    # Instantiate via cls rather than the hard-coded class name so that
    # subclasses get instances of their own type.
    return cls(AzureASRConfig.from_dict(config))
|
|
@@ -0,0 +1,90 @@
|
|
|
1
|
+
from dataclasses import dataclass
|
|
2
|
+
from typing import Any, Dict, Optional
|
|
3
|
+
import json
|
|
4
|
+
import os
|
|
5
|
+
|
|
6
|
+
import websockets
|
|
7
|
+
from websockets.legacy.client import WebSocketClientProtocol
|
|
8
|
+
|
|
9
|
+
from rasa.core.channels.voice_stream.asr.asr_engine import ASREngine, ASREngineConfig
|
|
10
|
+
from rasa.core.channels.voice_stream.asr.asr_event import (
|
|
11
|
+
ASREvent,
|
|
12
|
+
NewTranscript,
|
|
13
|
+
UserIsSpeaking,
|
|
14
|
+
)
|
|
15
|
+
from rasa.core.channels.voice_stream.audio_bytes import HERTZ, RasaAudioBytes
|
|
16
|
+
from rasa.shared.constants import DEEPGRAM_API_KEY_ENV_VAR
|
|
17
|
+
|
|
18
|
+
|
|
19
|
+
@dataclass
class DeepgramASRConfig(ASREngineConfig):
    """Configuration for the Deepgram streaming ASR engine.

    All fields default to None; concrete defaults come from
    DeepgramASR.get_default_config.
    """

    # Hostname of the Deepgram API, e.g. "api.deepgram.com".
    endpoint: Optional[str] = None
    # number of milliseconds of silence to determine end of speech
    endpointing: Optional[int] = None
    # Language code passed to the API, e.g. "en".
    language: Optional[str] = None
    # Deepgram model name, e.g. "nova-2-general".
    model: Optional[str] = None
    # Whether Deepgram should apply smart formatting to transcripts.
    smart_format: Optional[bool] = None
|
|
27
|
+
|
|
28
|
+
|
|
29
|
+
class DeepgramASR(ASREngine[DeepgramASRConfig]):
    """ASR engine streaming audio to the Deepgram websocket API."""

    required_env_vars = (DEEPGRAM_API_KEY_ENV_VAR,)

    def __init__(self, config: Optional[DeepgramASRConfig] = None):
        super().__init__(config)
        # Buffers "is_final" partial transcripts until Deepgram marks the
        # end of speech ("speech_final").
        self.accumulated_transcript = ""

    async def open_websocket_connection(self) -> WebSocketClientProtocol:
        """Connect to the ASR system."""
        deepgram_api_key = os.environ[DEEPGRAM_API_KEY_ENV_VAR]
        extra_headers = {"Authorization": f"Token {deepgram_api_key}"}
        api_url = self._get_api_url()
        query_params = self._get_query_params()
        return await websockets.connect(  # type: ignore
            api_url + query_params,
            extra_headers=extra_headers,
        )

    def _get_api_url(self) -> str:
        """Build the base websocket URL for the configured endpoint."""
        return f"wss://{self.config.endpoint}/v1/listen?"

    def _get_query_params(self) -> str:
        """Build the query string describing audio format and model options."""
        return (
            f"encoding=mulaw&sample_rate={HERTZ}&endpointing={self.config.endpointing}"
            f"&vad_events=true&language={self.config.language}&interim_results=true"
            f"&model={self.config.model}&smart_format={str(self.config.smart_format).lower()}"
        )

    async def signal_audio_done(self) -> None:
        """Signal to the ASR Api that you are done sending data."""
        if self.asr_socket is None:
            raise AttributeError("Websocket not connected.")
        await self.asr_socket.send(json.dumps({"type": "CloseStream"}))

    def rasa_audio_bytes_to_engine_bytes(self, chunk: RasaAudioBytes) -> bytes:
        """Convert RasaAudioBytes to bytes usable by this engine.

        Deepgram is configured for mulaw at the Rasa sample rate, so the
        bytes pass through unchanged.
        """
        return chunk

    def engine_event_to_asr_event(self, e: Any) -> Optional[ASREvent]:
        """Translate an engine event to a common ASREvent.

        Deepgram result messages carry an "is_final" flag: final segments
        are accumulated until "speech_final" marks the end of the
        utterance; non-final segments with text indicate ongoing speech.
        """
        data = json.loads(e)
        if "is_final" in data:
            transcript = data["channel"]["alternatives"][0]["transcript"]
            if data["is_final"]:
                if data.get("speech_final"):
                    full_transcript = self.accumulated_transcript + transcript
                    self.accumulated_transcript = ""
                    if full_transcript:
                        return NewTranscript(full_transcript)
                else:
                    self.accumulated_transcript += transcript
            elif transcript:
                return UserIsSpeaking()
        return None

    @staticmethod
    def get_default_config() -> DeepgramASRConfig:
        """Return the default configuration for the hosted Deepgram API."""
        return DeepgramASRConfig("api.deepgram.com", 400, "en", "nova-2-general", True)

    @classmethod
    def from_config_dict(cls, config: Dict) -> "DeepgramASR":
        """Build an engine instance from a raw configuration dictionary.

        Uses cls instead of the hard-coded class name so subclasses get
        instances of their own type.
        """
        return cls(DeepgramASRConfig.from_dict(config))
|
|
@@ -0,0 +1,8 @@
|
|
|
1
|
+
from typing import NewType
|
|
2
|
+
|
|
3
|
+
# A common intermediate audio byte format that acts as a shared data format,
# to prevent quadratic complexity between the formats of channels, ASR
# engines, and TTS engines.
# Currently corresponds to raw wave, 8khz, 8bit, mono channel, mulaw encoding.
RasaAudioBytes = NewType("RasaAudioBytes", bytes)
# Sample rate (in Hz) of the RasaAudioBytes format.
HERTZ = 8000
|
|
@@ -0,0 +1,107 @@
|
|
|
1
|
+
import audioop
|
|
2
|
+
import base64
|
|
3
|
+
import json
|
|
4
|
+
|
|
5
|
+
import structlog
|
|
6
|
+
import uuid
|
|
7
|
+
from typing import Any, Awaitable, Callable, Optional, Tuple
|
|
8
|
+
|
|
9
|
+
from sanic import Blueprint, HTTPResponse, Request, response
|
|
10
|
+
from sanic import Websocket # type: ignore
|
|
11
|
+
|
|
12
|
+
|
|
13
|
+
from rasa.core.channels import UserMessage
|
|
14
|
+
from rasa.core.channels.voice_ready.utils import CallParameters
|
|
15
|
+
from rasa.core.channels.voice_stream.call_state import call_state
|
|
16
|
+
from rasa.core.channels.voice_stream.tts.tts_engine import TTSEngine
|
|
17
|
+
from rasa.core.channels.voice_stream.audio_bytes import RasaAudioBytes
|
|
18
|
+
from rasa.core.channels.voice_stream.voice_channel import (
|
|
19
|
+
ContinueConversationAction,
|
|
20
|
+
EndConversationAction,
|
|
21
|
+
NewAudioAction,
|
|
22
|
+
VoiceChannelAction,
|
|
23
|
+
VoiceInputChannel,
|
|
24
|
+
VoiceOutputChannel,
|
|
25
|
+
)
|
|
26
|
+
|
|
27
|
+
logger = structlog.get_logger()
|
|
28
|
+
|
|
29
|
+
|
|
30
|
+
class BrowserAudioOutputChannel(VoiceOutputChannel):
    """Voice output channel streaming bot audio to the browser over JSON messages."""

    @classmethod
    def name(cls) -> str:
        """Name under which this channel is registered."""
        return "browser_audio"

    def rasa_audio_bytes_to_channel_bytes(
        self, rasa_audio_bytes: RasaAudioBytes
    ) -> bytes:
        """Decode mulaw audio into 4-byte linear PCM samples for the browser."""
        linear_pcm = audioop.ulaw2lin(rasa_audio_bytes, 4)
        return linear_pcm

    def channel_bytes_to_message(self, recipient_id: str, channel_bytes: bytes) -> str:
        """Wrap an audio chunk into a base64-encoded JSON websocket message."""
        encoded_audio = base64.b64encode(channel_bytes).decode("utf-8")
        return json.dumps({"audio": encoded_audio})

    def create_marker_message(self, recipient_id: str) -> Tuple[str, str]:
        """Create a marker message and its id; the browser echoes the marker back."""
        marker_id = uuid.uuid4().hex
        marker_message = json.dumps({"marker": marker_id})
        return marker_message, marker_id
|
|
46
|
+
|
|
47
|
+
|
|
48
|
+
class BrowserAudioInputChannel(VoiceInputChannel):
    """Voice input channel receiving browser microphone audio over a websocket."""

    @classmethod
    def name(cls) -> str:
        """Name under which this channel is registered."""
        return "browser_audio"

    def channel_bytes_to_rasa_audio_bytes(self, input_bytes: bytes) -> RasaAudioBytes:
        """Encode 4-byte linear PCM from the browser into mulaw RasaAudioBytes."""
        return RasaAudioBytes(audioop.lin2ulaw(input_bytes, 4))

    async def collect_call_parameters(
        self, channel_websocket: Websocket
    ) -> Optional[CallParameters]:
        """Create synthetic call parameters for a local inspector session.

        No real telephony metadata exists for a browser call, so a unique
        call id is generated and "local" placeholders are used.
        """
        call_id = f"inspect-{uuid.uuid4()}"
        return CallParameters(call_id, "local", "local", stream_id=call_id)

    def map_input_message(
        self,
        message: Any,
    ) -> VoiceChannelAction:
        """Translate a raw websocket message into a voice channel action.

        Messages are JSON objects carrying either a base64 "audio" chunk or
        a "marker" echoed back by the browser after playing bot audio.
        """
        data = json.loads(message)
        if "audio" in data:
            channel_bytes = base64.b64decode(data["audio"])
            audio_bytes = self.channel_bytes_to_rasa_audio_bytes(channel_bytes)
            return NewAudioAction(audio_bytes)
        elif "marker" in data:
            if data["marker"] == call_state.latest_bot_audio_id:
                # Just finished streaming last audio bytes
                call_state.is_bot_speaking = False  # type: ignore[attr-defined]
                if call_state.should_hangup:
                    logger.debug(
                        "browser_audio.hangup", marker=call_state.latest_bot_audio_id
                    )
                    return EndConversationAction()
            else:
                # Marker for an earlier chunk — presumably the bot is still
                # streaming audio; TODO confirm against marker semantics.
                call_state.is_bot_speaking = True  # type: ignore[attr-defined]
        return ContinueConversationAction()

    def create_output_channel(
        self, voice_websocket: Websocket, tts_engine: TTSEngine
    ) -> VoiceOutputChannel:
        """Build the matching output channel sharing this channel's TTS cache."""
        return BrowserAudioOutputChannel(
            voice_websocket,
            tts_engine,
            self.tts_cache,
        )

    def blueprint(
        self, on_new_message: Callable[[UserMessage], Awaitable[Any]]
    ) -> Blueprint:
        """Define a Sanic blueprint with a health route and the audio websocket."""
        blueprint = Blueprint("browser_audio", __name__)

        @blueprint.route("/", methods=["GET"])
        async def health(_: Request) -> HTTPResponse:
            return response.json({"status": "ok"})

        @blueprint.websocket("/websocket")  # type: ignore
        async def handle_message(request: Request, ws: Websocket) -> None:
            await self.run_audio_streaming(on_new_message, ws)

        return blueprint
|