rasa-pro 3.12.0.dev12__py3-none-any.whl → 3.12.0rc1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release: the registry flags this version of rasa-pro; see the package's registry page for details.

Files changed (153)
  1. rasa/anonymization/anonymization_rule_executor.py +16 -10
  2. rasa/cli/data.py +16 -0
  3. rasa/cli/inspect.py +20 -1
  4. rasa/cli/project_templates/calm/config.yml +2 -2
  5. rasa/cli/project_templates/calm/endpoints.yml +2 -2
  6. rasa/cli/shell.py +3 -3
  7. rasa/cli/utils.py +12 -0
  8. rasa/core/actions/action.py +99 -193
  9. rasa/core/actions/action_handle_digressions.py +142 -0
  10. rasa/core/actions/action_run_slot_rejections.py +16 -4
  11. rasa/core/actions/forms.py +10 -5
  12. rasa/core/channels/__init__.py +4 -0
  13. rasa/core/channels/studio_chat.py +19 -0
  14. rasa/core/channels/telegram.py +42 -24
  15. rasa/core/channels/voice_ready/audiocodes.py +42 -23
  16. rasa/core/channels/voice_ready/utils.py +1 -1
  17. rasa/core/channels/voice_stream/asr/asr_engine.py +10 -4
  18. rasa/core/channels/voice_stream/asr/azure.py +14 -1
  19. rasa/core/channels/voice_stream/asr/deepgram.py +20 -4
  20. rasa/core/channels/voice_stream/audiocodes.py +264 -0
  21. rasa/core/channels/voice_stream/browser_audio.py +5 -1
  22. rasa/core/channels/voice_stream/call_state.py +10 -1
  23. rasa/core/channels/voice_stream/genesys.py +335 -0
  24. rasa/core/channels/voice_stream/tts/azure.py +11 -2
  25. rasa/core/channels/voice_stream/tts/cartesia.py +29 -10
  26. rasa/core/channels/voice_stream/twilio_media_streams.py +2 -1
  27. rasa/core/channels/voice_stream/voice_channel.py +25 -3
  28. rasa/core/constants.py +2 -0
  29. rasa/core/migrate.py +2 -2
  30. rasa/core/nlg/contextual_response_rephraser.py +18 -1
  31. rasa/core/nlg/generator.py +83 -15
  32. rasa/core/nlg/response.py +6 -3
  33. rasa/core/nlg/translate.py +55 -0
  34. rasa/core/policies/enterprise_search_prompt_with_citation_template.jinja2 +1 -1
  35. rasa/core/policies/flows/flow_executor.py +47 -46
  36. rasa/core/processor.py +72 -9
  37. rasa/core/run.py +4 -3
  38. rasa/dialogue_understanding/commands/can_not_handle_command.py +20 -2
  39. rasa/dialogue_understanding/commands/cancel_flow_command.py +80 -4
  40. rasa/dialogue_understanding/commands/change_flow_command.py +20 -2
  41. rasa/dialogue_understanding/commands/chit_chat_answer_command.py +20 -2
  42. rasa/dialogue_understanding/commands/clarify_command.py +29 -3
  43. rasa/dialogue_understanding/commands/command.py +1 -16
  44. rasa/dialogue_understanding/commands/command_syntax_manager.py +55 -0
  45. rasa/dialogue_understanding/commands/correct_slots_command.py +11 -2
  46. rasa/dialogue_understanding/commands/handle_digressions_command.py +150 -0
  47. rasa/dialogue_understanding/commands/human_handoff_command.py +20 -2
  48. rasa/dialogue_understanding/commands/knowledge_answer_command.py +20 -2
  49. rasa/dialogue_understanding/commands/prompt_command.py +94 -0
  50. rasa/dialogue_understanding/commands/repeat_bot_messages_command.py +20 -2
  51. rasa/dialogue_understanding/commands/set_slot_command.py +29 -15
  52. rasa/dialogue_understanding/commands/skip_question_command.py +20 -2
  53. rasa/dialogue_understanding/commands/start_flow_command.py +61 -2
  54. rasa/dialogue_understanding/commands/utils.py +98 -4
  55. rasa/dialogue_understanding/constants.py +1 -0
  56. rasa/dialogue_understanding/generator/__init__.py +2 -0
  57. rasa/dialogue_understanding/generator/command_generator.py +110 -73
  58. rasa/dialogue_understanding/generator/command_parser.py +16 -13
  59. rasa/dialogue_understanding/generator/constants.py +3 -0
  60. rasa/dialogue_understanding/generator/llm_based_command_generator.py +170 -5
  61. rasa/dialogue_understanding/generator/llm_command_generator.py +5 -3
  62. rasa/dialogue_understanding/generator/multi_step/multi_step_llm_command_generator.py +26 -4
  63. rasa/dialogue_understanding/generator/nlu_command_adapter.py +44 -3
  64. rasa/dialogue_understanding/generator/prompt_templates/__init__.py +0 -0
  65. rasa/dialogue_understanding/generator/prompt_templates/command_prompt_template.jinja2 +60 -0
  66. rasa/dialogue_understanding/generator/prompt_templates/command_prompt_v2_claude_3_5_sonnet_20240620_template.jinja2 +77 -0
  67. rasa/dialogue_understanding/generator/prompt_templates/command_prompt_v2_default.jinja2 +68 -0
  68. rasa/dialogue_understanding/generator/{single_step/command_prompt_template.jinja2 → prompt_templates/command_prompt_v2_gpt_4o_2024_11_20_template.jinja2} +1 -1
  69. rasa/dialogue_understanding/generator/single_step/compact_llm_command_generator.py +460 -0
  70. rasa/dialogue_understanding/generator/single_step/single_step_llm_command_generator.py +12 -318
  71. rasa/dialogue_understanding/generator/utils.py +32 -1
  72. rasa/dialogue_understanding/patterns/collect_information.py +1 -1
  73. rasa/dialogue_understanding/patterns/correction.py +13 -1
  74. rasa/dialogue_understanding/patterns/default_flows_for_patterns.yml +78 -2
  75. rasa/dialogue_understanding/patterns/handle_digressions.py +81 -0
  76. rasa/dialogue_understanding/patterns/validate_slot.py +65 -0
  77. rasa/dialogue_understanding/processor/command_processor.py +154 -28
  78. rasa/dialogue_understanding/utils.py +31 -0
  79. rasa/dialogue_understanding_test/README.md +50 -0
  80. rasa/dialogue_understanding_test/du_test_case.py +28 -8
  81. rasa/dialogue_understanding_test/du_test_result.py +13 -9
  82. rasa/dialogue_understanding_test/io.py +14 -0
  83. rasa/dialogue_understanding_test/test_case_simulation/test_case_tracker_simulator.py +3 -3
  84. rasa/e2e_test/utils/io.py +0 -37
  85. rasa/engine/graph.py +1 -0
  86. rasa/engine/language.py +140 -0
  87. rasa/engine/recipes/config_files/default_config.yml +4 -0
  88. rasa/engine/recipes/default_recipe.py +2 -0
  89. rasa/engine/recipes/graph_recipe.py +2 -0
  90. rasa/engine/storage/local_model_storage.py +1 -0
  91. rasa/engine/storage/storage.py +4 -1
  92. rasa/model_manager/runner_service.py +7 -4
  93. rasa/model_manager/socket_bridge.py +7 -6
  94. rasa/model_manager/warm_rasa_process.py +0 -1
  95. rasa/model_training.py +24 -27
  96. rasa/shared/constants.py +15 -13
  97. rasa/shared/core/constants.py +30 -3
  98. rasa/shared/core/domain.py +13 -20
  99. rasa/shared/core/events.py +13 -2
  100. rasa/shared/core/flows/constants.py +11 -0
  101. rasa/shared/core/flows/flow.py +100 -19
  102. rasa/shared/core/flows/flows_yaml_schema.json +69 -3
  103. rasa/shared/core/flows/steps/collect.py +19 -37
  104. rasa/shared/core/flows/utils.py +43 -4
  105. rasa/shared/core/flows/validation.py +1 -1
  106. rasa/shared/core/slot_mappings.py +350 -111
  107. rasa/shared/core/slots.py +154 -3
  108. rasa/shared/core/trackers.py +77 -2
  109. rasa/shared/importers/importer.py +50 -2
  110. rasa/shared/nlu/constants.py +1 -0
  111. rasa/shared/nlu/training_data/schemas/responses.yml +19 -12
  112. rasa/shared/providers/_configs/azure_entra_id_config.py +541 -0
  113. rasa/shared/providers/_configs/azure_openai_client_config.py +138 -3
  114. rasa/shared/providers/_configs/client_config.py +3 -1
  115. rasa/shared/providers/_configs/default_litellm_client_config.py +3 -1
  116. rasa/shared/providers/_configs/huggingface_local_embedding_client_config.py +3 -1
  117. rasa/shared/providers/_configs/litellm_router_client_config.py +3 -1
  118. rasa/shared/providers/_configs/model_group_config.py +4 -2
  119. rasa/shared/providers/_configs/oauth_config.py +33 -0
  120. rasa/shared/providers/_configs/openai_client_config.py +3 -1
  121. rasa/shared/providers/_configs/rasa_llm_client_config.py +3 -1
  122. rasa/shared/providers/_configs/self_hosted_llm_client_config.py +3 -1
  123. rasa/shared/providers/constants.py +6 -0
  124. rasa/shared/providers/embedding/azure_openai_embedding_client.py +28 -3
  125. rasa/shared/providers/embedding/litellm_router_embedding_client.py +3 -1
  126. rasa/shared/providers/llm/_base_litellm_client.py +42 -17
  127. rasa/shared/providers/llm/azure_openai_llm_client.py +81 -25
  128. rasa/shared/providers/llm/default_litellm_llm_client.py +3 -1
  129. rasa/shared/providers/llm/litellm_router_llm_client.py +29 -8
  130. rasa/shared/providers/llm/llm_client.py +23 -7
  131. rasa/shared/providers/llm/openai_llm_client.py +9 -3
  132. rasa/shared/providers/llm/rasa_llm_client.py +11 -2
  133. rasa/shared/providers/llm/self_hosted_llm_client.py +30 -11
  134. rasa/shared/providers/router/_base_litellm_router_client.py +3 -1
  135. rasa/shared/providers/router/router_client.py +3 -1
  136. rasa/shared/utils/constants.py +3 -0
  137. rasa/shared/utils/llm.py +31 -8
  138. rasa/shared/utils/pykwalify_extensions.py +24 -0
  139. rasa/shared/utils/schemas/domain.yml +26 -1
  140. rasa/telemetry.py +45 -14
  141. rasa/tracing/config.py +2 -0
  142. rasa/tracing/constants.py +12 -0
  143. rasa/tracing/instrumentation/instrumentation.py +36 -0
  144. rasa/tracing/instrumentation/metrics.py +41 -0
  145. rasa/tracing/metric_instrument_provider.py +40 -0
  146. rasa/utils/common.py +0 -1
  147. rasa/validator.py +561 -89
  148. rasa/version.py +1 -1
  149. {rasa_pro-3.12.0.dev12.dist-info → rasa_pro-3.12.0rc1.dist-info}/METADATA +2 -1
  150. {rasa_pro-3.12.0.dev12.dist-info → rasa_pro-3.12.0rc1.dist-info}/RECORD +153 -134
  151. {rasa_pro-3.12.0.dev12.dist-info → rasa_pro-3.12.0rc1.dist-info}/NOTICE +0 -0
  152. {rasa_pro-3.12.0.dev12.dist-info → rasa_pro-3.12.0rc1.dist-info}/WHEEL +0 -0
  153. {rasa_pro-3.12.0.dev12.dist-info → rasa_pro-3.12.0rc1.dist-info}/entry_points.txt +0 -0
rasa/shared/utils/llm.py CHANGED
@@ -1,3 +1,4 @@
+import importlib.resources
 import json
 from copy import deepcopy
 from functools import wraps
@@ -19,6 +20,8 @@ import structlog
 import rasa.shared.utils.io
 from rasa.core.utils import AvailableEndpoints
 from rasa.shared.constants import (
+    DEFAULT_PROMPT_PACKAGE_NAME,
+    MODEL_CONFIG_KEY,
     MODEL_GROUP_CONFIG_KEY,
     MODEL_GROUP_ID_CONFIG_KEY,
     MODELS_CONFIG_KEY,
@@ -29,9 +32,7 @@ from rasa.shared.constants import (
 )
 from rasa.shared.core.events import BotUttered, UserUttered
 from rasa.shared.core.slots import BooleanSlot, CategoricalSlot, Slot
-from rasa.shared.engine.caching import (
-    get_local_cache_location,
-)
+from rasa.shared.engine.caching import get_local_cache_location
 from rasa.shared.exceptions import (
     FileIOException,
     FileNotFoundException,
@@ -355,13 +356,13 @@ def _combine_single_model_configs(
         )
         # Checks for deprecated keys, resolves aliases and returns a valid config.
         # This is done to ensure that the custom config is valid.
-        return client_config_clazz.from_dict(custom_config).to_dict()
+        return client_config_clazz.from_dict(deepcopy(custom_config)).to_dict()
 
     # If the provider is the same in both configs
     # OR provider is not specified in the custom config
     # perform MERGE by overriding the default config keys and values
     # with custom config keys and values.
-    merged_config = {**default_config.copy(), **custom_config.copy()}
+    merged_config = {**deepcopy(default_config), **deepcopy(custom_config)}
     # Check for deprecated keys, resolve aliases and return a valid config.
     # This is done to ensure that the merged config is valid.
     default_config_clazz = get_client_config_class_from_provider(
@@ -512,7 +513,7 @@ def llm_client_factory(
     Returns:
         Instantiated LLM based on the configuration.
     """
-    config = combine_custom_and_default_config(custom_config, default_config)
+    config = combine_custom_and_default_config(deepcopy(custom_config), default_config)
 
     ensure_cache()
 
@@ -641,7 +642,7 @@ def embedder_client_factory(
     Returns:
         Instantiated Embedder based on the configuration.
     """
-    config = combine_custom_and_default_config(custom_config, default_config)
+    config = combine_custom_and_default_config(deepcopy(custom_config), default_config)
 
     ensure_cache()
 
@@ -675,12 +676,34 @@ def get_prompt_template(
     return default_prompt_template
 
 
+def get_default_prompt_template_based_on_model(
+    config: Dict[str, Any],
+    model_prompt_mapping: Dict[str, Any],
+    fallback_prompt_path: str,
+) -> Text:
+    """Returns the default prompt template based on the model name.
+
+    Args:
+        config: The model config.
+        model_prompt_mapping: The mapping of model name to prompt template.
+        fallback_prompt_path: The fallback prompt path.
+
+    Returns:
+        The default prompt template.
+    """
+    provider = config.get(PROVIDER_CONFIG_KEY)
+    model = config.get(MODEL_CONFIG_KEY, "")
+    model_name = model if provider and provider in model else f"{provider}/{model}"
+    prompt_file_path = model_prompt_mapping.get(model_name, fallback_prompt_path)
+    return importlib.resources.read_text(DEFAULT_PROMPT_PACKAGE_NAME, prompt_file_path)
+
+
 def allowed_values_for_slot(slot: Slot) -> Union[str, None]:
     """Get the allowed values for a slot."""
     if isinstance(slot, BooleanSlot):
         return str([True, False])
     if isinstance(slot, CategoricalSlot):
-        return str([v for v in slot.values if v != "__other__"] + ["other"])
+        return str([v for v in slot.values if v != "__other__"])
     else:
         return None
 
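Note on the hunks above: the repeated deepcopy() calls guard against the config-merging helpers mutating dictionaries that callers still hold while aliases and deprecated keys are resolved. A minimal sketch of the pattern, using a hypothetical merge() helper rather than Rasa's actual functions:

    from copy import deepcopy

    def merge(default: dict, custom: dict) -> dict:
        # Copy both inputs so later in-place normalisation cannot leak back
        # into the caller's dictionaries.
        merged = {**deepcopy(default), **deepcopy(custom)}
        merged.setdefault("provider", "openai")
        return merged

    custom = {"model": "gpt-4o"}
    merge({"timeout": 7}, custom)
    assert "provider" not in custom  # the caller's dict stays untouched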
rasa/shared/utils/pykwalify_extensions.py CHANGED
@@ -8,6 +8,11 @@ from typing import Any, Dict, List, Text, Union
 
 from pykwalify.errors import SchemaError
 
+from rasa.shared.utils.constants import (
+    RASA_PRO_BETA_PREDICATES_IN_RESPONSE_CONDITIONS_ENV_VAR_NAME,
+)
+from rasa.utils.beta import ensure_beta_feature_is_enabled
+
 
 def require_response_keys(
     responses: List[Dict[Text, Any]], _: Dict, __: Text
@@ -24,4 +29,23 @@ def require_response_keys(
                 "null 'text' value in response."
             )
 
+        conditions = response.get("condition", [])
+        if isinstance(conditions, str):
+            ensure_beta_feature_is_enabled(
+                "predicates in response conditions",
+                RASA_PRO_BETA_PREDICATES_IN_RESPONSE_CONDITIONS_ENV_VAR_NAME,
+            )
+            continue
+
+        for condition in conditions:
+            if not isinstance(condition, dict):
+                return SchemaError("Condition must be a dictionary.")
+            if not all(key in condition for key in ("type", "name", "value")):
+                return SchemaError(
+                    "Condition must have 'type', 'name', and 'value' keys."
+                )
+
+            if condition.get("type") != "slot":
+                return SchemaError("Condition type must be of type `slot`.")
+
     return True
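For context, require_response_keys validates response variations after YAML parsing, so it operates on plain Python structures. A hedged sketch of the two condition shapes the new checks distinguish (the structured form reflects the keys the validator requires; the predicate string syntax is illustrative only):

    # Accepted without any feature flag: a list of dicts with exactly the
    # keys "type", "name" and "value", and "type" restricted to "slot".
    structured_condition_response = {
        "text": "Welcome back!",
        "condition": [{"type": "slot", "name": "logged_in", "value": True}],
    }

    # Accepted only when the beta env var named by
    # RASA_PRO_BETA_PREDICATES_IN_RESPONSE_CONDITIONS_ENV_VAR_NAME is enabled:
    # a bare predicate string (syntax shown here is a guess, not from the docs).
    predicate_condition_response = {
        "text": "Welcome back!",
        "condition": "slots.logged_in = true",
    }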
rasa/shared/utils/schemas/domain.yml CHANGED
@@ -78,7 +78,6 @@ mapping:
       mappings:
         type: "seq"
         required: False
-        allowempty: False
         sequence:
           - type: "map"
             allowempty: True
@@ -99,6 +98,11 @@ mapping:
                 type: "any"
               action:
                 type: "str"
+              run_action_every_turn:
+                type: "str"
+              coexistence_system:
+                type: "str"
+                enum: ["NLU", "CALM", "SHARED"]
               conditions:
                 type: "seq"
                 sequence:
@@ -112,6 +116,27 @@ mapping:
                       active_flow:
                         type: "str"
                         nullable: True
+      validation:
+        type: map
+        required: false
+        mapping:
+          rejections:
+            type: seq
+            required: true
+            sequence:
+              - type: map
+                mapping:
+                  if:
+                    type: str
+                    required: true
+                  utter:
+                    type: str
+                    required: true
+                  refill_utter:
+                    type: str
+                    required: false
+                    nullable: false
+
   forms:
     type: "map"
     required: False
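Taken together, the schema changes admit per-slot validation rules plus run_action_every_turn and coexistence_system metadata. A hedged sketch of a slot entry the schema would accept, written as the parsed structure pykwalify checks; the slot mapping, action and utterance names and the predicate syntax are illustrative, not taken from Rasa's documentation:

    slot_entry = {
        "type": "float",
        "mappings": [{"type": "from_llm"}],           # mapping type shown is illustrative
        "run_action_every_turn": "action_check_amount",
        "coexistence_system": "CALM",                 # one of "NLU", "CALM", "SHARED"
        "validation": {
            "rejections": [
                {
                    "if": "slots.amount <= 0",        # predicate syntax is assumed
                    "utter": "utter_invalid_amount",
                    "refill_utter": "utter_ask_amount_again",
                }
            ]
        },
    }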
rasa/telemetry.py CHANGED
@@ -15,7 +15,7 @@ from collections import defaultdict
 from datetime import datetime
 from functools import wraps
 from pathlib import Path
-from typing import Any, Callable, Dict, List, Optional, Text
+from typing import Any, Callable, Dict, List, Optional, Text, Tuple
 
 import importlib_resources
 import requests
@@ -35,6 +35,7 @@ from rasa.constants import (
 )
 from rasa.engine.storage.local_model_storage import LocalModelStorage
 from rasa.shared.constants import (
+    ASSISTANT_ID_KEY,
     CONFIG_LANGUAGE_KEY,
     CONFIG_PIPELINE_KEY,
     CONFIG_POLICIES_KEY,
@@ -111,6 +112,7 @@ CI_ENVIRONMENT_TELL = [
 # https://rasa.com/docs/rasa-pro/telemetry/reference
 TRAINING_STARTED_EVENT = "Training Started"
 TRAINING_COMPLETED_EVENT = "Training Completed"
+TRAINING_FAILED_EVENT = "Training Failed"
 TELEMETRY_DISABLED_EVENT = "Telemetry Disabled"
 TELEMETRY_DATA_SPLIT_EVENT = "Training Data Split"
 TELEMETRY_DATA_VALIDATED_EVENT = "Training Data Validated"
@@ -527,7 +529,6 @@ def _send_request(url: Text, payload: Dict[Text, Any]) -> None:
     """
     if _is_telemetry_debug_enabled():
        print_telemetry_payload(payload)
-        return
 
     write_key = _get_telemetry_write_key()
     if not write_key:
@@ -976,6 +977,7 @@ def track_model_training(
         "language": config.get(CONFIG_LANGUAGE_KEY),
         "training_id": training_id,
         "type": model_type,
+        "assistant_id": config.get(ASSISTANT_ID_KEY),
         "pipeline": config.get(CONFIG_PIPELINE_KEY),
         "policies": config.get(CONFIG_POLICIES_KEY),
         "train_schema": config.get(CONFIG_TRAIN_SCHEMA),
@@ -1021,13 +1023,28 @@ def track_model_training(
         tracking_data,
     )
     start = datetime.now()
-    yield
+    try:
+        yield
+    except (Exception, SystemExit):
+        runtime = datetime.now() - start
+        _track(
+            TRAINING_FAILED_EVENT,
+            {
+                "training_id": training_id,
+                "assistant_id": config.get(ASSISTANT_ID_KEY),
+                "type": model_type,
+                "runtime": int(runtime.total_seconds()),
+            },
+        )
+        raise
+
     runtime = datetime.now() - start
 
     _track(
         TRAINING_COMPLETED_EVENT,
         {
             "training_id": training_id,
+            "assistant_id": config.get(ASSISTANT_ID_KEY),
             "type": model_type,
             "runtime": int(runtime.total_seconds()),
         },
@@ -1108,6 +1125,7 @@ def _get_llm_command_generator_config(config: Dict[str, Any]) -> Optional[Dict]:
     retrieval is enabled, and flow retrieval embedding model.
     """
     from rasa.dialogue_understanding.generator import (
+        CompactLLMCommandGenerator,
         LLMCommandGenerator,
         MultiStepLLMCommandGenerator,
         SingleStepLLMCommandGenerator,
@@ -1137,6 +1155,7 @@ def _get_llm_command_generator_config(config: Dict[str, Any]) -> Optional[Dict]:
             LLMCommandGenerator.__name__,
             SingleStepLLMCommandGenerator.__name__,
             MultiStepLLMCommandGenerator.__name__,
+            CompactLLMCommandGenerator.__name__,
         ]:
             return component
     return None
@@ -1326,24 +1345,28 @@ def track_server_start(
     """
     from rasa.core.utils import AvailableEndpoints
 
-    def project_fingerprint_from_model(
+    def project_fingerprint_and_assistant_id_from_model(
         _model_directory: Optional[Text],
-    ) -> Optional[Text]:
+    ) -> Tuple[Optional[Text], Optional[Text]]:
         """Gets project fingerprint from an app's loaded model."""
         if not model_directory:
-            return None
+            return None, None
 
         try:
             model_archive = model.get_local_model(_model_directory)
             metadata = LocalModelStorage.metadata_from_archive(model_archive)
 
-            return metadata.project_fingerprint
+            return metadata.project_fingerprint, metadata.assistant_id
         except Exception:
-            return None
+            return None, None
 
     if not endpoints:
         endpoints = AvailableEndpoints()
 
+    project, assistant_id = project_fingerprint_and_assistant_id_from_model(
+        model_directory
+    )
+
     _track(
         TELEMETRY_SERVER_STARTED_EVENT,
         {
@@ -1365,7 +1388,8 @@ def track_server_start(
             "endpoints_event_broker": endpoints.event_broker.type
             if endpoints.event_broker
             else None,
-            "project": project_fingerprint_from_model(model_directory),
+            "project": project,
+            "assistant_id": assistant_id,
         },
     )
 
@@ -1383,23 +1407,30 @@ def track_project_init(path: Text) -> None:
 
 
 @ensure_telemetry_enabled
-def track_shell_started(model_type: Text) -> None:
+def track_shell_started(model_type: Text, assistant_id: Text) -> None:
     """Track when a user starts a bot using rasa shell.
 
     Args:
         model_type: Type of the model, core / nlu or rasa.
     """
-    _track(TELEMETRY_SHELL_STARTED_EVENT, {"type": model_type})
+    _track(
+        TELEMETRY_SHELL_STARTED_EVENT,
+        {"type": model_type, "assistant_id": assistant_id},
+    )
 
 
 @ensure_telemetry_enabled
-def track_inspect_started(model_type: Text) -> None:
+def track_inspect_started(channel: Text, assistant_id: Text) -> None:
     """Track when a user starts a bot using rasa inspect.
 
     Args:
-        model_type: Type of the model, core / nlu or rasa.
+        channel: Type of channel used.
+        assistant_id: ID of the assistant being inspected.
     """
-    _track(TELEMETRY_INSPECT_STARTED_EVENT, {"type": model_type})
+    _track(
+        TELEMETRY_INSPECT_STARTED_EVENT,
+        {"type": channel, "assistant_id": assistant_id},
+    )
 
 
 @ensure_telemetry_enabled
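The track_model_training change wraps the yield in a try/except so a "Training Failed" event is reported before the original error (including SystemExit) is re-raised. A minimal standalone sketch of the same context-manager pattern, with a print-based report() standing in for Rasa's _track():

    from contextlib import contextmanager
    from datetime import datetime

    def report(event: str, runtime_seconds: int) -> None:
        print(f"{event}: {runtime_seconds}s")  # stand-in for the real telemetry call

    @contextmanager
    def track_duration():
        start = datetime.now()
        try:
            yield
        except (Exception, SystemExit):
            # Report the failure, then let the error propagate to the caller.
            report("failed", int((datetime.now() - start).total_seconds()))
            raise
        report("completed", int((datetime.now() - start).total_seconds()))

    with track_duration():
        pass  # the wrapped work; raising here would emit "failed" instead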
rasa/tracing/config.py CHANGED
@@ -29,6 +29,7 @@ from rasa.dialogue_understanding.commands import (
     FreeFormAnswerCommand,
 )
 from rasa.dialogue_understanding.generator import (
+    CompactLLMCommandGenerator,
     LLMCommandGenerator,
     MultiStepLLMCommandGenerator,
     SingleStepLLMCommandGenerator,
@@ -110,6 +111,7 @@ def configure_tracing(tracer_provider: Optional[TracerProvider]) -> None:
         endpoint_config_class=EndpointConfig,
         grpc_custom_action_executor_class=GRPCCustomActionExecutor,
         single_step_llm_command_generator_class=SingleStepLLMCommandGenerator,
+        compact_llm_command_generator_class=CompactLLMCommandGenerator,
         multi_step_llm_command_generator_class=MultiStepLLMCommandGenerator,
         custom_action_executor_subclasses=custom_action_executor_subclasses,
         flow_retrieval_class=FlowRetrieval,
rasa/tracing/constants.py CHANGED
@@ -32,6 +32,18 @@ SINGLE_STEP_LLM_COMMAND_GENERATOR_PROMPT_TOKEN_USAGE_METRIC_NAME = (
 SINGLE_STEP_LLM_COMMAND_GENERATOR_LLM_RESPONSE_DURATION_METRIC_NAME = (
     "single_step_llm_command_generator_llm_response_duration"
 )
+COMPACT_LLM_COMMAND_GENERATOR_CPU_USAGE_METRIC_NAME = (
+    "compact_llm_command_generator_cpu_usage"
+)
+COMPACT_LLM_COMMAND_GENERATOR_MEMORY_USAGE_METRIC_NAME = (
+    "compact_llm_command_generator_memory_usage"
+)
+COMPACT_LLM_COMMAND_GENERATOR_PROMPT_TOKEN_USAGE_METRIC_NAME = (
+    "compact_llm_command_generator_prompt_token_usage"
+)
+COMPACT_LLM_COMMAND_GENERATOR_LLM_RESPONSE_DURATION_METRIC_NAME = (
+    "compact_llm_command_generator_llm_response_duration"
+)
 MULTI_STEP_LLM_COMMAND_GENERATOR_CPU_USAGE_METRIC_NAME = (
     "multi_step_llm_command_generator_cpu_usage"
 )
rasa/tracing/instrumentation/instrumentation.py CHANGED
@@ -41,6 +41,7 @@ from rasa.core.processor import MessageProcessor
 from rasa.core.tracker_store import TrackerStore
 from rasa.dialogue_understanding.commands import Command
 from rasa.dialogue_understanding.generator import (
+    CompactLLMCommandGenerator,
     LLMCommandGenerator,
     MultiStepLLMCommandGenerator,
     SingleStepLLMCommandGenerator,
@@ -64,6 +65,7 @@ from rasa.tracing.instrumentation.intentless_policy_instrumentation import (
 )
 from rasa.tracing.instrumentation.metrics import (
     record_callable_duration_metrics,
+    record_compact_llm_command_generator_metrics,
     record_llm_command_generator_metrics,
     record_multi_step_llm_command_generator_metrics,
     record_request_size_in_bytes,
@@ -286,6 +288,9 @@ LLMCommandGeneratorType = TypeVar("LLMCommandGeneratorType", bound=LLMCommandGen
 SingleStepLLMCommandGeneratorType = TypeVar(
     "SingleStepLLMCommandGeneratorType", bound=SingleStepLLMCommandGenerator
 )
+CompactLLMCommandGeneratorType = TypeVar(
+    "CompactLLMCommandGeneratorType", bound=CompactLLMCommandGenerator
+)
 MultiStepLLMCommandGeneratorType = TypeVar(
     "MultiStepLLMCommandGeneratorType", bound=MultiStepLLMCommandGenerator
 )
@@ -318,6 +323,9 @@ def instrument(
     single_step_llm_command_generator_class: Optional[
         Type[SingleStepLLMCommandGeneratorType]
     ] = None,
+    compact_llm_command_generator_class: Optional[
+        Type[CompactLLMCommandGeneratorType]
+    ] = None,
     multi_step_llm_command_generator_class: Optional[
         Type[MultiStepLLMCommandGeneratorType]
     ] = None,
@@ -368,6 +376,9 @@ def instrument(
     :param single_step_llm_command_generator_class: The `SingleStepLLMCommandGenerator`
         to be instrumented. If `None` is given, no `SingleStepLLMCommandGenerator` will
        be instrumented.
+    :param compact_llm_command_generator_class: The `CompactLLMCommandGenerator`
+        to be instrumented. If `None` is given, no `CompactLLMCommandGenerator` will
+        be instrumented.
     :param multi_step_llm_command_generator_class: The `MultiStepLLMCommandGenerator`
         to be instrumented. If `None` is given, no `MultiStepLLMCommandGenerator` will
         be instrumented.
@@ -492,6 +503,30 @@ def instrument(
         )
         mark_class_as_instrumented(single_step_llm_command_generator_class)
 
+    if compact_llm_command_generator_class is not None and not class_is_instrumented(
+        compact_llm_command_generator_class
+    ):
+        _instrument_method(
+            tracer_provider.get_tracer(compact_llm_command_generator_class.__module__),
+            compact_llm_command_generator_class,
+            "invoke_llm",
+            attribute_extractors.extract_attrs_for_llm_based_command_generator,
+            metrics_recorder=record_compact_llm_command_generator_metrics,
+        )
+        _instrument_method(
+            tracer_provider.get_tracer(compact_llm_command_generator_class.__module__),
+            compact_llm_command_generator_class,
+            "_check_commands_against_startable_flows",
+            attribute_extractors.extract_attrs_for_check_commands_against_startable_flows,
+        )
+        _instrument_perform_health_check_method_for_component(
+            tracer_provider.get_tracer(compact_llm_command_generator_class.__module__),
+            compact_llm_command_generator_class,
+            "perform_llm_health_check",
+            attribute_extractors.extract_attrs_for_performing_health_check,
+        )
+        mark_class_as_instrumented(compact_llm_command_generator_class)
+
     if multi_step_llm_command_generator_class is not None and not class_is_instrumented(
         multi_step_llm_command_generator_class
     ):
@@ -526,6 +561,7 @@ def instrument(
         for llm_based_command_generator_class in (
             llm_command_generator_class,
             single_step_llm_command_generator_class,
+            compact_llm_command_generator_class,
             multi_step_llm_command_generator_class,
         )
     )
rasa/tracing/instrumentation/metrics.py CHANGED
@@ -6,11 +6,16 @@ from rasa.core.nlg.contextual_response_rephraser import ContextualResponseRephra
 from rasa.core.policies.enterprise_search_policy import EnterpriseSearchPolicy
 from rasa.core.policies.intentless_policy import IntentlessPolicy
 from rasa.dialogue_understanding.generator import (
+    CompactLLMCommandGenerator,
     LLMCommandGenerator,
     MultiStepLLMCommandGenerator,
     SingleStepLLMCommandGenerator,
 )
 from rasa.tracing.constants import (
+    COMPACT_LLM_COMMAND_GENERATOR_CPU_USAGE_METRIC_NAME,
+    COMPACT_LLM_COMMAND_GENERATOR_LLM_RESPONSE_DURATION_METRIC_NAME,
+    COMPACT_LLM_COMMAND_GENERATOR_MEMORY_USAGE_METRIC_NAME,
+    COMPACT_LLM_COMMAND_GENERATOR_PROMPT_TOKEN_USAGE_METRIC_NAME,
     CONTEXTUAL_RESPONSE_REPHRASER_LLM_RESPONSE_DURATION_METRIC_NAME,
     ENTERPRISE_SEARCH_POLICY_LLM_RESPONSE_DURATION_METRIC_NAME,
     INTENTLESS_POLICY_LLM_RESPONSE_DURATION_METRIC_NAME,
@@ -170,6 +175,36 @@ def record_single_step_llm_command_generator_metrics(
     )
 
 
+def record_compact_llm_command_generator_metrics(
+    attributes: Dict[str, Any],
+) -> None:
+    """
+    Record measurements for CompactLLMCommandGenerator specific metrics.
+
+    The recording is done by the opentelemetry.metrics.Histogram instruments.
+    These instruments are registered to the MetricInstrumentProvider internal singleton.
+
+    :param attributes: Extracted tracing attributes
+    :return: None
+    """
+    instrument_provider = MetricInstrumentProvider()
+
+    if not instrument_provider.instruments:
+        return None
+
+    record_llm_based_command_generator_cpu_usage(
+        instrument_provider, COMPACT_LLM_COMMAND_GENERATOR_CPU_USAGE_METRIC_NAME
+    )
+    record_llm_based_command_generator_memory_usage(
+        instrument_provider, COMPACT_LLM_COMMAND_GENERATOR_MEMORY_USAGE_METRIC_NAME
+    )
+    record_llm_based_command_generator_prompt_token(
+        instrument_provider,
+        attributes,
+        COMPACT_LLM_COMMAND_GENERATOR_PROMPT_TOKEN_USAGE_METRIC_NAME,
+    )
+
+
 def record_multi_step_llm_command_generator_metrics(attributes: Dict[str, Any]) -> None:
     """
     Record measurements for MultiStepLLMCommandGenerator specific metrics.
@@ -205,6 +240,7 @@ def record_callable_duration_metrics(
     Record duration of instrumented method calls invoked for the following components:
     - LLMCommandGenerator
     - SingleStepLLMCommandGenerator
+    - CompactLLMCommandGenerator
     - MultiStepLLMCommandGenerator
     - EnterpriseSearchPolicy
     - IntentlessPolicy
@@ -235,6 +271,11 @@
             SINGLE_STEP_LLM_COMMAND_GENERATOR_LLM_RESPONSE_DURATION_METRIC_NAME
         )
 
+    if type(self) == CompactLLMCommandGenerator:
+        metric_instrument = instrument_provider.get_instrument(
+            COMPACT_LLM_COMMAND_GENERATOR_LLM_RESPONSE_DURATION_METRIC_NAME
+        )
+
     if type(self) == MultiStepLLMCommandGenerator:
         metric_instrument = instrument_provider.get_instrument(
             MULTI_STEP_LLM_COMMAND_GENERATOR_LLM_RESPONSE_DURATION_METRIC_NAME
rasa/tracing/metric_instrument_provider.py CHANGED
@@ -4,6 +4,10 @@ from opentelemetry.metrics import get_meter_provider
 from opentelemetry.sdk.metrics import Meter
 
 from rasa.tracing.constants import (
+    COMPACT_LLM_COMMAND_GENERATOR_CPU_USAGE_METRIC_NAME,
+    COMPACT_LLM_COMMAND_GENERATOR_LLM_RESPONSE_DURATION_METRIC_NAME,
+    COMPACT_LLM_COMMAND_GENERATOR_MEMORY_USAGE_METRIC_NAME,
+    COMPACT_LLM_COMMAND_GENERATOR_PROMPT_TOKEN_USAGE_METRIC_NAME,
     CONTEXTUAL_RESPONSE_REPHRASER_LLM_RESPONSE_DURATION_METRIC_NAME,
     DURATION_UNIT_NAME,
     ENTERPRISE_SEARCH_POLICY_LLM_RESPONSE_DURATION_METRIC_NAME,
@@ -43,6 +47,7 @@ class MetricInstrumentProvider(metaclass=Singleton):
         instruments = {
             **self._create_llm_command_generator_instruments(meter),
             **self._create_single_step_llm_command_generator_instruments(meter),
+            **self._create_compact_llm_command_generator_instruments(meter),
             **self._create_multi_step_llm_command_generator_instruments(meter),
             **self._create_llm_response_duration_instruments(meter),
             **self._create_client_request_instruments(meter),
@@ -122,6 +127,41 @@ class MetricInstrumentProvider(metaclass=Singleton):
             SINGLE_STEP_LLM_COMMAND_GENERATOR_LLM_RESPONSE_DURATION_METRIC_NAME: single_step_llm_response_duration_llm_command_generator,  # noqa: E501
         }
 
+    @staticmethod
+    def _create_compact_llm_command_generator_instruments(
+        meter: Meter,
+    ) -> Dict[str, Any]:
+        compact_llm_command_generator_cpu_usage = meter.create_histogram(
+            name=COMPACT_LLM_COMMAND_GENERATOR_CPU_USAGE_METRIC_NAME,
+            description="CPU percentage for CompactLLMCommandGenerator",
+            unit=LLM_BASED_COMMAND_GENERATOR_CPU_MEMORY_USAGE_UNIT_NAME,
+        )
+
+        compact_llm_command_generator_memory_usage = meter.create_histogram(
+            name=COMPACT_LLM_COMMAND_GENERATOR_MEMORY_USAGE_METRIC_NAME,
+            description="RAM memory usage for CompactLLMCommandGenerator",
+            unit=LLM_BASED_COMMAND_GENERATOR_CPU_MEMORY_USAGE_UNIT_NAME,
+        )
+
+        compact_llm_command_generator_prompt_token_usage = meter.create_histogram(
+            name=COMPACT_LLM_COMMAND_GENERATOR_PROMPT_TOKEN_USAGE_METRIC_NAME,
+            description="CompactLLMCommandGenerator prompt token length",
+            unit="1",
+        )
+
+        compact_llm_response_duration_llm_command_generator = meter.create_histogram(
+            name=COMPACT_LLM_COMMAND_GENERATOR_LLM_RESPONSE_DURATION_METRIC_NAME,
+            description="The duration of CompactLLMCommandGenerator's LLM call",
+            unit=DURATION_UNIT_NAME,
+        )
+
+        return {
+            COMPACT_LLM_COMMAND_GENERATOR_CPU_USAGE_METRIC_NAME: compact_llm_command_generator_cpu_usage,  # noqa: E501
+            COMPACT_LLM_COMMAND_GENERATOR_MEMORY_USAGE_METRIC_NAME: compact_llm_command_generator_memory_usage,  # noqa: E501
+            COMPACT_LLM_COMMAND_GENERATOR_PROMPT_TOKEN_USAGE_METRIC_NAME: compact_llm_command_generator_prompt_token_usage,  # noqa: E501
+            COMPACT_LLM_COMMAND_GENERATOR_LLM_RESPONSE_DURATION_METRIC_NAME: compact_llm_response_duration_llm_command_generator,  # noqa: E501
+        }
+
     @staticmethod
     def _create_multi_step_llm_command_generator_instruments(
         meter: Meter,
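The new instruments use the standard OpenTelemetry metrics API, the same create_histogram()/record() calls visible above. A small self-contained sketch of that API with a console exporter for demonstration; the metric name matches one of the new constants, while the unit and attributes are illustrative:

    from opentelemetry import metrics
    from opentelemetry.sdk.metrics import MeterProvider
    from opentelemetry.sdk.metrics.export import (
        ConsoleMetricExporter,
        PeriodicExportingMetricReader,
    )

    # Wire up a provider that periodically prints measurements to stdout.
    reader = PeriodicExportingMetricReader(ConsoleMetricExporter())
    metrics.set_meter_provider(MeterProvider(metric_readers=[reader]))

    meter = metrics.get_meter_provider().get_meter("rasa.tracing.example")
    duration_histogram = meter.create_histogram(
        name="compact_llm_command_generator_llm_response_duration",
        description="Duration of the LLM call",
        unit="ms",
    )

    # Record one measurement; attributes let backends slice the histogram.
    duration_histogram.record(412.0, attributes={"model": "example-model"})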
rasa/utils/common.py CHANGED
@@ -70,7 +70,6 @@ EXPECTED_WARNINGS: List[Tuple[Type[Warning], str]] = [
         "Converting sparse IndexedSlices.* to a dense Tensor of unknown "
         "shape. This may consume a large amount of memory.",
     ),
-    (UserWarning, "Slot auto-fill has been removed in 3.0 .*"),
     # Cannot fix this deprecation warning since we need to support two
     # numpy versions as long as we keep python 37 around
     (DeprecationWarning, "the `interpolation=` argument to quantile was renamed"),