rasa-pro 3.13.0.dev7__py3-none-any.whl → 3.13.0.dev8__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of rasa-pro might be problematic. Click here for more details.

Files changed (150) hide show
  1. rasa/__main__.py +0 -3
  2. rasa/api.py +1 -1
  3. rasa/cli/dialogue_understanding_test.py +1 -1
  4. rasa/cli/e2e_test.py +1 -1
  5. rasa/cli/evaluate.py +1 -1
  6. rasa/cli/export.py +1 -1
  7. rasa/cli/llm_fine_tuning.py +12 -11
  8. rasa/cli/project_templates/defaults.py +133 -0
  9. rasa/cli/run.py +1 -1
  10. rasa/cli/studio/link.py +53 -0
  11. rasa/cli/studio/pull.py +78 -0
  12. rasa/cli/studio/push.py +78 -0
  13. rasa/cli/studio/studio.py +12 -0
  14. rasa/cli/studio/upload.py +8 -0
  15. rasa/cli/train.py +1 -1
  16. rasa/cli/utils.py +1 -1
  17. rasa/cli/x.py +1 -1
  18. rasa/constants.py +2 -0
  19. rasa/core/__init__.py +0 -16
  20. rasa/core/actions/action.py +5 -1
  21. rasa/core/actions/action_repeat_bot_messages.py +18 -22
  22. rasa/core/actions/action_run_slot_rejections.py +0 -1
  23. rasa/core/agent.py +16 -1
  24. rasa/core/available_endpoints.py +146 -0
  25. rasa/core/brokers/pika.py +1 -2
  26. rasa/core/channels/botframework.py +2 -2
  27. rasa/core/channels/channel.py +2 -2
  28. rasa/core/channels/hangouts.py +8 -5
  29. rasa/core/channels/mattermost.py +1 -1
  30. rasa/core/channels/rasa_chat.py +2 -4
  31. rasa/core/channels/rest.py +5 -4
  32. rasa/core/channels/studio_chat.py +3 -2
  33. rasa/core/channels/vier_cvg.py +1 -2
  34. rasa/core/channels/voice_ready/audiocodes.py +1 -8
  35. rasa/core/channels/voice_stream/audiocodes.py +7 -4
  36. rasa/core/channels/voice_stream/genesys.py +2 -2
  37. rasa/core/channels/voice_stream/twilio_media_streams.py +10 -5
  38. rasa/core/channels/voice_stream/voice_channel.py +33 -22
  39. rasa/core/http_interpreter.py +3 -7
  40. rasa/core/jobs.py +2 -1
  41. rasa/core/nlg/contextual_response_rephraser.py +34 -9
  42. rasa/core/nlg/generator.py +0 -1
  43. rasa/core/nlg/interpolator.py +2 -3
  44. rasa/core/nlg/summarize.py +39 -5
  45. rasa/core/policies/enterprise_search_policy.py +283 -62
  46. rasa/core/policies/enterprise_search_prompt_with_relevancy_check_and_citation_template.jinja2 +63 -0
  47. rasa/core/policies/flow_policy.py +1 -1
  48. rasa/core/policies/flows/flow_executor.py +96 -17
  49. rasa/core/policies/intentless_policy.py +9 -7
  50. rasa/core/processor.py +104 -51
  51. rasa/core/run.py +33 -11
  52. rasa/core/tracker_stores/tracker_store.py +1 -1
  53. rasa/core/training/interactive.py +1 -1
  54. rasa/core/utils.py +24 -97
  55. rasa/dialogue_understanding/coexistence/intent_based_router.py +2 -1
  56. rasa/dialogue_understanding/commands/can_not_handle_command.py +2 -0
  57. rasa/dialogue_understanding/commands/cancel_flow_command.py +2 -0
  58. rasa/dialogue_understanding/commands/chit_chat_answer_command.py +2 -0
  59. rasa/dialogue_understanding/commands/clarify_command.py +5 -1
  60. rasa/dialogue_understanding/commands/command_syntax_manager.py +1 -0
  61. rasa/dialogue_understanding/commands/human_handoff_command.py +2 -0
  62. rasa/dialogue_understanding/commands/knowledge_answer_command.py +4 -2
  63. rasa/dialogue_understanding/commands/repeat_bot_messages_command.py +2 -0
  64. rasa/dialogue_understanding/commands/set_slot_command.py +11 -1
  65. rasa/dialogue_understanding/commands/skip_question_command.py +2 -0
  66. rasa/dialogue_understanding/commands/start_flow_command.py +4 -0
  67. rasa/dialogue_understanding/commands/utils.py +26 -2
  68. rasa/dialogue_understanding/generator/__init__.py +7 -1
  69. rasa/dialogue_understanding/generator/command_generator.py +4 -2
  70. rasa/dialogue_understanding/generator/command_parser.py +2 -2
  71. rasa/dialogue_understanding/generator/command_parser_validator.py +63 -0
  72. rasa/dialogue_understanding/generator/prompt_templates/command_prompt_v2_gpt_4o_2024_11_20_template.jinja2 +12 -33
  73. rasa/dialogue_understanding/generator/prompt_templates/command_prompt_v3_gpt_4o_2024_11_20_template.jinja2 +78 -0
  74. rasa/dialogue_understanding/generator/single_step/compact_llm_command_generator.py +26 -461
  75. rasa/dialogue_understanding/generator/single_step/search_ready_llm_command_generator.py +147 -0
  76. rasa/dialogue_understanding/generator/single_step/single_step_based_llm_command_generator.py +477 -0
  77. rasa/dialogue_understanding/generator/single_step/single_step_llm_command_generator.py +8 -58
  78. rasa/dialogue_understanding/patterns/default_flows_for_patterns.yml +37 -25
  79. rasa/dialogue_understanding/patterns/domain_for_patterns.py +190 -0
  80. rasa/dialogue_understanding/processor/command_processor.py +3 -3
  81. rasa/dialogue_understanding/processor/command_processor_component.py +3 -3
  82. rasa/dialogue_understanding/stack/frames/flow_stack_frame.py +17 -4
  83. rasa/dialogue_understanding/utils.py +68 -12
  84. rasa/dialogue_understanding_test/du_test_case.py +1 -1
  85. rasa/dialogue_understanding_test/du_test_runner.py +4 -22
  86. rasa/dialogue_understanding_test/test_case_simulation/test_case_tracker_simulator.py +2 -6
  87. rasa/e2e_test/e2e_test_runner.py +1 -1
  88. rasa/engine/constants.py +1 -1
  89. rasa/engine/recipes/default_recipe.py +26 -2
  90. rasa/engine/validation.py +3 -2
  91. rasa/hooks.py +0 -28
  92. rasa/llm_fine_tuning/annotation_module.py +39 -9
  93. rasa/llm_fine_tuning/conversations.py +3 -0
  94. rasa/llm_fine_tuning/llm_data_preparation_module.py +66 -49
  95. rasa/llm_fine_tuning/paraphrasing/rephrase_validator.py +52 -44
  96. rasa/llm_fine_tuning/paraphrasing_module.py +10 -12
  97. rasa/llm_fine_tuning/storage.py +4 -4
  98. rasa/llm_fine_tuning/utils.py +63 -1
  99. rasa/model_manager/model_api.py +88 -0
  100. rasa/model_manager/trainer_service.py +4 -4
  101. rasa/plugin.py +1 -11
  102. rasa/privacy/__init__.py +0 -0
  103. rasa/privacy/constants.py +83 -0
  104. rasa/privacy/event_broker_utils.py +77 -0
  105. rasa/privacy/privacy_config.py +281 -0
  106. rasa/privacy/privacy_config_schema.json +86 -0
  107. rasa/privacy/privacy_filter.py +340 -0
  108. rasa/privacy/privacy_manager.py +576 -0
  109. rasa/server.py +23 -2
  110. rasa/shared/constants.py +3 -0
  111. rasa/shared/core/constants.py +4 -3
  112. rasa/shared/core/domain.py +7 -0
  113. rasa/shared/core/events.py +37 -7
  114. rasa/shared/core/flows/flow.py +1 -2
  115. rasa/shared/core/flows/flows_yaml_schema.json +3 -0
  116. rasa/shared/core/flows/steps/collect.py +46 -2
  117. rasa/shared/core/slots.py +28 -0
  118. rasa/shared/exceptions.py +4 -0
  119. rasa/shared/utils/llm.py +161 -6
  120. rasa/shared/utils/yaml.py +32 -0
  121. rasa/studio/data_handler.py +3 -3
  122. rasa/studio/download/download.py +37 -60
  123. rasa/studio/download/flows.py +23 -31
  124. rasa/studio/link.py +200 -0
  125. rasa/studio/pull.py +94 -0
  126. rasa/studio/push.py +131 -0
  127. rasa/studio/upload.py +117 -67
  128. rasa/telemetry.py +82 -25
  129. rasa/tracing/config.py +3 -4
  130. rasa/tracing/constants.py +19 -1
  131. rasa/tracing/instrumentation/attribute_extractors.py +10 -2
  132. rasa/tracing/instrumentation/instrumentation.py +53 -2
  133. rasa/tracing/instrumentation/metrics.py +98 -15
  134. rasa/tracing/metric_instrument_provider.py +75 -3
  135. rasa/utils/common.py +1 -27
  136. rasa/utils/log_utils.py +1 -45
  137. rasa/validator.py +2 -8
  138. rasa/version.py +1 -1
  139. {rasa_pro-3.13.0.dev7.dist-info → rasa_pro-3.13.0.dev8.dist-info}/METADATA +5 -6
  140. {rasa_pro-3.13.0.dev7.dist-info → rasa_pro-3.13.0.dev8.dist-info}/RECORD +143 -129
  141. rasa/anonymization/__init__.py +0 -2
  142. rasa/anonymization/anonymisation_rule_yaml_reader.py +0 -91
  143. rasa/anonymization/anonymization_pipeline.py +0 -286
  144. rasa/anonymization/anonymization_rule_executor.py +0 -266
  145. rasa/anonymization/anonymization_rule_orchestrator.py +0 -119
  146. rasa/anonymization/schemas/config.yml +0 -47
  147. rasa/anonymization/utils.py +0 -118
  148. {rasa_pro-3.13.0.dev7.dist-info → rasa_pro-3.13.0.dev8.dist-info}/NOTICE +0 -0
  149. {rasa_pro-3.13.0.dev7.dist-info → rasa_pro-3.13.0.dev8.dist-info}/WHEEL +0 -0
  150. {rasa_pro-3.13.0.dev7.dist-info → rasa_pro-3.13.0.dev8.dist-info}/entry_points.txt +0 -0
@@ -1,7 +1,8 @@
1
+ import dataclasses
1
2
  import importlib.resources
2
3
  import json
3
4
  import re
4
- from typing import TYPE_CHECKING, Any, Dict, List, Optional, Text
5
+ from typing import TYPE_CHECKING, Any, Dict, List, Literal, Optional, Text
5
6
 
6
7
  import dotenv
7
8
  import structlog
@@ -9,6 +10,7 @@ from jinja2 import Template
9
10
  from pydantic import ValidationError
10
11
 
11
12
  import rasa.shared.utils.io
13
+ from rasa.core.available_endpoints import AvailableEndpoints
12
14
  from rasa.core.constants import (
13
15
  POLICY_MAX_HISTORY,
14
16
  POLICY_PRIORITY,
@@ -23,7 +25,6 @@ from rasa.core.information_retrieval import (
23
25
  )
24
26
  from rasa.core.information_retrieval.faiss import FAISS_Store
25
27
  from rasa.core.policies.policy import Policy, PolicyPrediction
26
- from rasa.core.utils import AvailableEndpoints
27
28
  from rasa.dialogue_understanding.generator.constants import (
28
29
  LLM_CONFIG_KEY,
29
30
  )
@@ -53,7 +54,9 @@ from rasa.shared.constants import (
53
54
  MODEL_NAME_CONFIG_KEY,
54
55
  OPENAI_PROVIDER,
55
56
  PROMPT_CONFIG_KEY,
57
+ PROMPT_TEMPLATE_CONFIG_KEY,
56
58
  PROVIDER_CONFIG_KEY,
59
+ RASA_PATTERN_CANNOT_HANDLE_NO_RELEVANT_ANSWER,
57
60
  TEMPERATURE_CONFIG_KEY,
58
61
  TIMEOUT_CONFIG_KEY,
59
62
  )
@@ -78,7 +81,6 @@ from rasa.shared.nlu.training_data.training_data import TrainingData
78
81
  from rasa.shared.providers.embedding._langchain_embedding_client_adapter import (
79
82
  _LangchainEmbeddingClientAdapter,
80
83
  )
81
- from rasa.shared.providers.llm.llm_client import LLMClient
82
84
  from rasa.shared.providers.llm.llm_response import LLMResponse, measure_llm_latency
83
85
  from rasa.shared.utils.cli import print_error_and_exit
84
86
  from rasa.shared.utils.constants import (
@@ -113,7 +115,7 @@ if TYPE_CHECKING:
113
115
 
114
116
  from rasa.utils.log_utils import log_llm
115
117
 
116
- logger = structlog.get_logger()
118
+ structlogger = structlog.get_logger()
117
119
 
118
120
  dotenv.load_dotenv("./.env")
119
121
 
@@ -124,6 +126,7 @@ VECTOR_STORE_THRESHOLD_PROPERTY = "threshold"
124
126
  TRACE_TOKENS_PROPERTY = "trace_prompt_tokens"
125
127
  CITATION_ENABLED_PROPERTY = "citation_enabled"
126
128
  USE_LLM_PROPERTY = "use_generative_llm"
129
+ CHECK_RELEVANCY_PROPERTY = "check_relevancy"
127
130
  MAX_MESSAGES_IN_QUERY_KEY = "max_messages_in_query"
128
131
 
129
132
  DEFAULT_VECTOR_STORE_TYPE = "faiss"
@@ -134,6 +137,10 @@ DEFAULT_VECTOR_STORE = {
134
137
  VECTOR_STORE_THRESHOLD_PROPERTY: DEFAULT_VECTOR_STORE_THRESHOLD,
135
138
  }
136
139
 
140
+ DEFAULT_CHECK_RELEVANCY_PROPERTY = False
141
+ DEFAULT_USE_LLM_PROPERTY = True
142
+ DEFAULT_CITATION_ENABLED_PROPERTY = False
143
+
137
144
  DEFAULT_LLM_CONFIG = {
138
145
  PROVIDER_CONFIG_KEY: OPENAI_PROVIDER,
139
146
  MODEL_CONFIG_KEY: DEFAULT_OPENAI_CHAT_MODEL_NAME,
@@ -162,6 +169,18 @@ DEFAULT_ENTERPRISE_SEARCH_PROMPT_WITH_CITATION_TEMPLATE = importlib.resources.re
162
169
  "rasa.core.policies", "enterprise_search_prompt_with_citation_template.jinja2"
163
170
  )
164
171
 
172
+ DEFAULT_ENTERPRISE_SEARCH_PROMPT_WITH_RELEVANCY_CHECK_AND_CITATION_TEMPLATE = (
173
+ importlib.resources.read_text(
174
+ "rasa.core.policies",
175
+ "enterprise_search_prompt_with_relevancy_check_and_citation_template.jinja2",
176
+ )
177
+ )
178
+
179
+ # TODO: Update this pattern once the experiments are done
180
+ _ENTERPRISE_SEARCH_ANSWER_NOT_RELEVANT_PATTERN = re.compile(
181
+ r"\[NO_RELEVANT_ANSWER_FOUND\]"
182
+ )
183
+
165
184
 
166
185
  class VectorStoreConnectionError(RasaException):
167
186
  """Exception raised for errors in connecting to the vector store."""
@@ -171,6 +190,12 @@ class VectorStoreConfigurationError(RasaException):
171
190
  """Exception raised for errors in vector store configuration."""
172
191
 
173
192
 
193
+ @dataclasses.dataclass
194
+ class _RelevancyCheckResponse:
195
+ answer: Optional[str]
196
+ relevant: bool
197
+
198
+
174
199
  @DefaultV1Recipe.register(
175
200
  DefaultV1Recipe.ComponentType.POLICY_WITH_END_TO_END_SUPPORT, is_trainable=True
176
201
  )
@@ -220,6 +245,11 @@ class EnterpriseSearchPolicy(LLMHealthCheckMixin, EmbeddingsHealthCheckMixin, Po
220
245
  """Constructs a new Policy object."""
221
246
  super().__init__(config, model_storage, resource, execution_context, featurizer)
222
247
 
248
+ # Check for deprecated keys and issue a warning if those are used
249
+ self._check_config_keys_and_warn_if_deprecated()
250
+ # Check for mutual exclusivity of extractive and generative search
251
+ self._check_and_warn_mutual_exclusivity_of_extractive_and_generative_search()
252
+
223
253
  # Resolve LLM config
224
254
  self.config[LLM_CONFIG_KEY] = resolve_model_client_config(
225
255
  self.config.get(LLM_CONFIG_KEY), EnterpriseSearchPolicy.__name__
@@ -234,6 +264,9 @@ class EnterpriseSearchPolicy(LLMHealthCheckMixin, EmbeddingsHealthCheckMixin, Po
234
264
  self.vector_store_config = self.config.get(
235
265
  VECTOR_STORE_PROPERTY, DEFAULT_VECTOR_STORE
236
266
  )
267
+ self.vector_search_threshold = self.vector_store_config.get(
268
+ VECTOR_STORE_THRESHOLD_PROPERTY, DEFAULT_VECTOR_STORE_THRESHOLD
269
+ )
237
270
 
238
271
  # Embeddings configuration for encoding the search query
239
272
  self.embeddings_config = (
@@ -249,30 +282,77 @@ class EnterpriseSearchPolicy(LLMHealthCheckMixin, EmbeddingsHealthCheckMixin, Po
249
282
  # Maximum number of messages to include in the search query
250
283
  self.max_messages_in_query = self.config.get(MAX_MESSAGES_IN_QUERY_KEY, 2)
251
284
 
252
- # boolean to enable/disable tracing of prompt tokens
285
+ # Boolean to enable/disable tracing of prompt tokens
253
286
  self.trace_prompt_tokens = self.config.get(TRACE_TOKENS_PROPERTY, False)
254
287
 
255
- # boolean to enable/disable the use of LLM for response generation
256
- self.use_llm = self.config.get(USE_LLM_PROPERTY, True)
288
+ # Boolean to enable/disable the use of LLM for response generation
289
+ self.use_llm = self.config.get(USE_LLM_PROPERTY, DEFAULT_USE_LLM_PROPERTY)
257
290
 
258
- # boolean to enable/disable citation generation
259
- self.citation_enabled = self.config.get(CITATION_ENABLED_PROPERTY, False)
291
+ # Boolean to enable/disable citation generation. This flag enables citation
292
+ # logic, but it only takes effect if `use_llm` is True.
293
+ self.citation_enabled = self.config.get(
294
+ CITATION_ENABLED_PROPERTY, DEFAULT_CITATION_ENABLED_PROPERTY
295
+ )
260
296
 
261
- self.prompt_template = prompt_template or get_prompt_template(
262
- self.config.get(PROMPT_CONFIG_KEY),
263
- DEFAULT_ENTERPRISE_SEARCH_PROMPT_TEMPLATE,
264
- log_source_component=EnterpriseSearchPolicy.__name__,
265
- log_source_method=LOG_COMPONENT_SOURCE_METHOD_INIT,
297
+ # Boolean to enable/disable the use of relevancy check alongside answer
298
+ # generation. This flag enables relevancy check logic, but it only takes effect if
299
+ # `use_llm` is True.
300
+ self.relevancy_check_enabled = self.config.get(
301
+ CHECK_RELEVANCY_PROPERTY, DEFAULT_CHECK_RELEVANCY_PROPERTY
266
302
  )
267
- self.citation_prompt_template = get_prompt_template(
268
- self.config.get(PROMPT_CONFIG_KEY),
269
- DEFAULT_ENTERPRISE_SEARCH_PROMPT_WITH_CITATION_TEMPLATE,
270
- log_source_component=EnterpriseSearchPolicy.__name__,
271
- log_source_method=LOG_COMPONENT_SOURCE_METHOD_INIT,
303
+
304
+ # Resolve the prompt template. The prompt will only be used if the 'use_llm' is
305
+ # set to True.
306
+ self.prompt_template = prompt_template or self._resolve_prompt_template(
307
+ self.config, LOG_COMPONENT_SOURCE_METHOD_INIT
272
308
  )
273
- # If citation is enabled, use the citation prompt template
274
- if self.citation_enabled:
275
- self.prompt_template = self.citation_prompt_template
309
+
310
+ def _check_config_keys_and_warn_if_deprecated(self) -> None:
311
+ """Checks and warns about deprecated config parameters."""
312
+ if (
313
+ PROMPT_CONFIG_KEY in self.config
314
+ and PROMPT_TEMPLATE_CONFIG_KEY in self.config
315
+ ):
316
+ structlogger.warning(
317
+ "enterprise_search_policy.init"
318
+ ".both_deprecated_and_non_deprecated_config_keys_used_at_the_same_time",
319
+ event_info=(
320
+ f"Both '{PROMPT_CONFIG_KEY}' and '{PROMPT_TEMPLATE_CONFIG_KEY}' "
321
+ f"are present in the config. '{PROMPT_CONFIG_KEY}' will be ignored "
322
+ f"in favor of {PROMPT_TEMPLATE_CONFIG_KEY}."
323
+ ),
324
+ )
325
+
326
+ # 'prompt' config key is deprecated in favor of 'prompt_template'
327
+ if PROMPT_CONFIG_KEY in self.config:
328
+ structlogger.warning(
329
+ "enterprise_search_policy.init.deprecated_config_key",
330
+ event_info=(
331
+ f"The config parameter '{PROMPT_CONFIG_KEY}' is deprecated "
332
+ "and will be removed in Rasa 4.0.0. "
333
+ f"Please use the config parameter '{PROMPT_TEMPLATE_CONFIG_KEY}'"
334
+ f"instead. "
335
+ ),
336
+ )
337
+
338
+ def _check_and_warn_mutual_exclusivity_of_extractive_and_generative_search(
339
+ self,
340
+ ) -> None:
341
+ if self.config.get(
342
+ CHECK_RELEVANCY_PROPERTY, DEFAULT_CHECK_RELEVANCY_PROPERTY
343
+ ) and not self.config.get(USE_LLM_PROPERTY, DEFAULT_USE_LLM_PROPERTY):
344
+ structlogger.warning(
345
+ "enterprise_search_policy.init"
346
+ ".relevancy_check_enabled_with_disabled_generative_search",
347
+ event_info=(
348
+ f"The config parameter '{CHECK_RELEVANCY_PROPERTY}' is set to"
349
+ f"'True', but the generative search is disabled (config"
350
+ f"parameter '{USE_LLM_PROPERTY}' is set to 'False'). As a result, "
351
+ "the relevancy check for the generative search will be disabled. "
352
+ f"To use this check, set the config parameter '{USE_LLM_PROPERTY}' "
353
+ f"to `True`."
354
+ ),
355
+ )
276
356
 
277
357
  @classmethod
278
358
  def _create_plain_embedder(cls, config: Dict[Text, Any]) -> "Embeddings":
@@ -366,7 +446,7 @@ class EnterpriseSearchPolicy(LLMHealthCheckMixin, EmbeddingsHealthCheckMixin, Po
366
446
  try:
367
447
  embeddings = self._create_plain_embedder(self.config)
368
448
  except (ValidationError, Exception) as e:
369
- logger.error(
449
+ structlogger.error(
370
450
  "enterprise_search_policy.train.embedder_instantiation_failed",
371
451
  message="Unable to instantiate the embedding client.",
372
452
  error=e,
@@ -377,7 +457,7 @@ class EnterpriseSearchPolicy(LLMHealthCheckMixin, EmbeddingsHealthCheckMixin, Po
377
457
  )
378
458
 
379
459
  if store_type == DEFAULT_VECTOR_STORE_TYPE:
380
- logger.info("enterprise_search_policy.train.faiss")
460
+ structlogger.info("enterprise_search_policy.train.faiss")
381
461
  with self._model_storage.write_to(self._resource) as path:
382
462
  self.vector_store = FAISS_Store(
383
463
  docs_folder=self.vector_store_config.get(SOURCE_PROPERTY),
@@ -386,7 +466,9 @@ class EnterpriseSearchPolicy(LLMHealthCheckMixin, EmbeddingsHealthCheckMixin, Po
386
466
  create_index=True,
387
467
  )
388
468
  else:
389
- logger.info("enterprise_search_policy.train.custom", store_type=store_type)
469
+ structlogger.info(
470
+ "enterprise_search_policy.train.custom", store_type=store_type
471
+ )
390
472
 
391
473
  # telemetry call to track training completion
392
474
  track_enterprise_search_policy_train_completed(
@@ -402,6 +484,7 @@ class EnterpriseSearchPolicy(LLMHealthCheckMixin, EmbeddingsHealthCheckMixin, Po
402
484
  or self.llm_config.get(MODEL_NAME_CONFIG_KEY),
403
485
  llm_model_group_id=self.llm_config.get(MODEL_GROUP_ID_CONFIG_KEY),
404
486
  citation_enabled=self.citation_enabled,
487
+ relevancy_check_enabled=self.relevancy_check_enabled,
405
488
  )
406
489
  self.persist()
407
490
  return self._resource
@@ -454,7 +537,7 @@ class EnterpriseSearchPolicy(LLMHealthCheckMixin, EmbeddingsHealthCheckMixin, Po
454
537
  config = endpoints.vector_store if endpoints else None
455
538
  store_type = self.vector_store_config.get(VECTOR_STORE_TYPE_PROPERTY)
456
539
  if config is None and store_type != DEFAULT_VECTOR_STORE_TYPE:
457
- logger.error(
540
+ structlogger.error(
458
541
  "enterprise_search_policy._connect_vector_store_or_raise.no_config"
459
542
  )
460
543
  raise VectorStoreConfigurationError(
@@ -464,7 +547,7 @@ class EnterpriseSearchPolicy(LLMHealthCheckMixin, EmbeddingsHealthCheckMixin, Po
464
547
  try:
465
548
  self.vector_store.connect(config) # type: ignore
466
549
  except Exception as e:
467
- logger.error(
550
+ structlogger.error(
468
551
  "enterprise_search_policy._connect_vector_store_or_raise.connect_error",
469
552
  error=e,
470
553
  config=config,
@@ -490,14 +573,14 @@ class EnterpriseSearchPolicy(LLMHealthCheckMixin, EmbeddingsHealthCheckMixin, Po
490
573
  transcript.append(sanitize_message_for_prompt(event.text))
491
574
 
492
575
  search_query = " ".join(transcript[-history:][::-1])
493
- logger.debug("search_query", search_query=search_query)
576
+ structlogger.debug("search_query", search_query=search_query)
494
577
  return search_query
495
578
 
496
579
  async def predict_action_probabilities( # type: ignore[override]
497
580
  self,
498
581
  tracker: DialogueStateTracker,
499
582
  domain: Domain,
500
- endpoints: Optional[AvailableEndpoints],
583
+ endpoints: Optional[AvailableEndpoints] = None,
501
584
  rule_only_data: Optional[Dict[Text, Any]] = None,
502
585
  **kwargs: Any,
503
586
  ) -> PolicyPrediction:
@@ -516,23 +599,20 @@ class EnterpriseSearchPolicy(LLMHealthCheckMixin, EmbeddingsHealthCheckMixin, Po
516
599
  The prediction.
517
600
  """
518
601
  logger_key = "enterprise_search_policy.predict_action_probabilities"
519
- vector_search_threshold = self.vector_store_config.get(
520
- VECTOR_STORE_THRESHOLD_PROPERTY, DEFAULT_VECTOR_STORE_THRESHOLD
521
- )
522
- llm = llm_factory(self.config.get(LLM_CONFIG_KEY), DEFAULT_LLM_CONFIG)
602
+
523
603
  if not self.supports_current_stack_frame(
524
604
  tracker, False, False
525
605
  ) or self.should_abstain_in_coexistence(tracker, True):
526
606
  return self._prediction(self._default_predictions(domain))
527
607
 
528
608
  if not self.vector_store:
529
- logger.error(f"{logger_key}.no_vector_store")
609
+ structlogger.error(f"{logger_key}.no_vector_store")
530
610
  return self._create_prediction_internal_error(domain, tracker)
531
611
 
532
612
  try:
533
613
  self._connect_vector_store_or_raise(endpoints)
534
614
  except (VectorStoreConfigurationError, VectorStoreConnectionError) as e:
535
- logger.error(f"{logger_key}.connection_error", error=e)
615
+ structlogger.error(f"{logger_key}.connection_error", error=e)
536
616
  return self._create_prediction_internal_error(domain, tracker)
537
617
 
538
618
  search_query = self._prepare_search_query(
@@ -544,20 +624,19 @@ class EnterpriseSearchPolicy(LLMHealthCheckMixin, EmbeddingsHealthCheckMixin, Po
544
624
  documents = await self.vector_store.search(
545
625
  query=search_query,
546
626
  tracker_state=tracker_state,
547
- threshold=vector_search_threshold,
627
+ threshold=self.vector_search_threshold,
548
628
  )
549
629
  except InformationRetrievalException as e:
550
- logger.error(f"{logger_key}.search_error", error=e)
630
+ structlogger.error(f"{logger_key}.search_error", error=e)
551
631
  return self._create_prediction_internal_error(domain, tracker)
552
632
 
553
633
  if not documents.results:
554
- logger.info(f"{logger_key}.no_documents")
634
+ structlogger.info(f"{logger_key}.no_documents")
555
635
  return self._create_prediction_cannot_handle(domain, tracker)
556
636
 
557
637
  if self.use_llm:
558
638
  prompt = self._render_prompt(tracker, documents.results)
559
- llm_response = await self._generate_llm_answer(llm, prompt)
560
- llm_response = LLMResponse.ensure_llm_response(llm_response)
639
+ llm_response = await self._invoke_llm(prompt)
561
640
 
562
641
  self._add_prompt_and_llm_response_to_latest_message(
563
642
  tracker=tracker,
@@ -567,24 +646,38 @@ class EnterpriseSearchPolicy(LLMHealthCheckMixin, EmbeddingsHealthCheckMixin, Po
567
646
  )
568
647
 
569
648
  if llm_response is None or not llm_response.choices:
570
- logger.debug(f"{logger_key}.no_llm_response")
649
+ structlogger.debug(f"{logger_key}.no_llm_response")
571
650
  response = None
572
651
  else:
573
652
  llm_answer = llm_response.choices[0]
574
653
 
654
+ if self.relevancy_check_enabled:
655
+ relevancy_response = self._parse_llm_relevancy_check_response(
656
+ llm_answer
657
+ )
658
+ if not relevancy_response.relevant:
659
+ structlogger.debug(f"{logger_key}.answer_not_relevant")
660
+ return self._create_prediction_cannot_handle(
661
+ domain,
662
+ tracker,
663
+ RASA_PATTERN_CANNOT_HANDLE_NO_RELEVANT_ANSWER,
664
+ )
665
+
575
666
  if self.citation_enabled:
576
667
  llm_answer = self.post_process_citations(llm_answer)
577
668
 
578
- logger.debug(f"{logger_key}.llm_answer", llm_answer=llm_answer)
669
+ structlogger.debug(
670
+ f"{logger_key}.llm_answer", prompt=prompt, llm_answer=llm_answer
671
+ )
579
672
  response = llm_answer
580
673
  else:
581
674
  response = documents.results[0].metadata.get("answer", None)
582
675
  if not response:
583
- logger.error(
676
+ structlogger.error(
584
677
  f"{logger_key}.answer_key_missing_in_metadata",
585
678
  search_results=documents.results,
586
679
  )
587
- logger.debug(
680
+ structlogger.debug(
588
681
  "enterprise_search_policy.predict_action_probabilities.no_llm",
589
682
  search_results=documents,
590
683
  )
@@ -616,6 +709,7 @@ class EnterpriseSearchPolicy(LLMHealthCheckMixin, EmbeddingsHealthCheckMixin, Po
616
709
  or self.llm_config.get(MODEL_NAME_CONFIG_KEY),
617
710
  llm_model_group_id=self.llm_config.get(MODEL_GROUP_ID_CONFIG_KEY),
618
711
  citation_enabled=self.citation_enabled,
712
+ relevancy_check_enabled=self.relevancy_check_enabled,
619
713
  )
620
714
  return self._create_prediction(
621
715
  domain=domain, tracker=tracker, action_metadata=action_metadata
@@ -639,11 +733,12 @@ class EnterpriseSearchPolicy(LLMHealthCheckMixin, EmbeddingsHealthCheckMixin, Po
639
733
  ),
640
734
  "docs": documents,
641
735
  "slots": self._prepare_slots_for_template(tracker),
736
+ "check_relevancy": self.relevancy_check_enabled,
642
737
  "citation_enabled": self.citation_enabled,
643
738
  }
644
739
  prompt = Template(self.prompt_template).render(**inputs)
645
740
  log_llm(
646
- logger=logger,
741
+ logger=structlogger,
647
742
  log_module="EnterpriseSearchPolicy",
648
743
  log_event="enterprise_search_policy._render_prompt.prompt_rendered",
649
744
  prompt=prompt,
@@ -651,9 +746,7 @@ class EnterpriseSearchPolicy(LLMHealthCheckMixin, EmbeddingsHealthCheckMixin, Po
651
746
  return prompt
652
747
 
653
748
  @measure_llm_latency
654
- async def _generate_llm_answer(
655
- self, llm: LLMClient, prompt: Text
656
- ) -> Optional[LLMResponse]:
749
+ async def _invoke_llm(self, prompt: Text) -> Optional[LLMResponse]:
657
750
  """Fetches an LLM completion for the provided prompt.
658
751
 
659
752
  Args:
@@ -663,17 +756,32 @@ class EnterpriseSearchPolicy(LLMHealthCheckMixin, EmbeddingsHealthCheckMixin, Po
663
756
  Returns:
664
757
  An LLMResponse object, or None if the call fails.
665
758
  """
759
+ llm = llm_factory(self.config.get(LLM_CONFIG_KEY), DEFAULT_LLM_CONFIG)
666
760
  try:
667
- return await llm.acompletion(prompt)
761
+ response = await llm.acompletion(prompt)
762
+ return LLMResponse.ensure_llm_response(response)
668
763
  except Exception as e:
669
764
  # unfortunately, langchain does not wrap LLM exceptions which means
670
765
  # we have to catch all exceptions here
671
- logger.error(
766
+ structlogger.error(
672
767
  "enterprise_search_policy._generate_llm_answer.llm_error",
673
768
  error=e,
674
769
  )
675
770
  return None
676
771
 
772
+ def _parse_llm_relevancy_check_response(
773
+ self, llm_answer: str
774
+ ) -> _RelevancyCheckResponse:
775
+ """Checks if the LLM response is relevant by parsing it."""
776
+ answer_relevant = not _ENTERPRISE_SEARCH_ANSWER_NOT_RELEVANT_PATTERN.search(
777
+ llm_answer
778
+ )
779
+ structlogger.debug("")
780
+ return _RelevancyCheckResponse(
781
+ answer=llm_answer if answer_relevant else None,
782
+ relevant=answer_relevant,
783
+ )
784
+
677
785
  def _create_prediction(
678
786
  self,
679
787
  domain: Domain,
@@ -708,10 +816,18 @@ class EnterpriseSearchPolicy(LLMHealthCheckMixin, EmbeddingsHealthCheckMixin, Po
708
816
  )
709
817
 
710
818
  def _create_prediction_cannot_handle(
711
- self, domain: Domain, tracker: DialogueStateTracker
819
+ self,
820
+ domain: Domain,
821
+ tracker: DialogueStateTracker,
822
+ reason: Optional[str] = None,
712
823
  ) -> PolicyPrediction:
824
+ cannot_handle_stack_frame = (
825
+ CannotHandlePatternFlowStackFrame(reason=reason)
826
+ if reason is not None
827
+ else CannotHandlePatternFlowStackFrame()
828
+ )
713
829
  return self._create_prediction_for_pattern(
714
- domain, tracker, CannotHandlePatternFlowStackFrame()
830
+ domain, tracker, cannot_handle_stack_frame
715
831
  )
716
832
 
717
833
  def _create_prediction_for_pattern(
@@ -780,7 +896,7 @@ class EnterpriseSearchPolicy(LLMHealthCheckMixin, EmbeddingsHealthCheckMixin, Po
780
896
  path / ENTERPRISE_SEARCH_PROMPT_FILE_NAME
781
897
  )
782
898
  except (FileNotFoundError, FileIOException) as e:
783
- logger.warning(
899
+ structlogger.warning(
784
900
  "enterprise_search_policy.load.failed", error=e, resource=resource.name
785
901
  )
786
902
 
@@ -790,7 +906,7 @@ class EnterpriseSearchPolicy(LLMHealthCheckMixin, EmbeddingsHealthCheckMixin, Po
790
906
 
791
907
  embeddings = cls._create_plain_embedder(config)
792
908
 
793
- logger.info("enterprise_search_policy.load", config=config)
909
+ structlogger.info("enterprise_search_policy.load", config=config)
794
910
  if store_type == DEFAULT_VECTOR_STORE_TYPE:
795
911
  # if a vector store is not specified,
796
912
  # default to using FAISS with the index stored in the model
@@ -849,15 +965,12 @@ class EnterpriseSearchPolicy(LLMHealthCheckMixin, EmbeddingsHealthCheckMixin, Po
849
965
  @classmethod
850
966
  def fingerprint_addon(cls, config: Dict[str, Any]) -> Optional[str]:
851
967
  """Add a fingerprint of enterprise search policy for the graph."""
852
- local_knowledge_data = cls._get_local_knowledge_data(config)
853
-
854
- prompt_template = get_prompt_template(
855
- config.get(PROMPT_CONFIG_KEY),
856
- DEFAULT_ENTERPRISE_SEARCH_PROMPT_TEMPLATE,
857
- log_source_component=EnterpriseSearchPolicy.__name__,
858
- log_source_method=LOG_COMPONENT_SOURCE_METHOD_FINGERPRINT_ADDON,
968
+ prompt_template = cls._resolve_prompt_template(
969
+ config, LOG_COMPONENT_SOURCE_METHOD_FINGERPRINT_ADDON
859
970
  )
860
971
 
972
+ local_knowledge_data = cls._get_local_knowledge_data(config)
973
+
861
974
  llm_config = resolve_model_client_config(
862
975
  config.get(LLM_CONFIG_KEY), EnterpriseSearchPolicy.__name__
863
976
  )
@@ -881,7 +994,7 @@ class EnterpriseSearchPolicy(LLMHealthCheckMixin, EmbeddingsHealthCheckMixin, Po
881
994
  Returns:
882
995
  The post-processed LLM answer.
883
996
  """
884
- logger.debug(
997
+ structlogger.debug(
885
998
  "enterprise_search_policy.post_process_citations", llm_answer=llm_answer
886
999
  )
887
1000
 
@@ -982,3 +1095,111 @@ class EnterpriseSearchPolicy(LLMHealthCheckMixin, EmbeddingsHealthCheckMixin, Po
982
1095
  log_source_method,
983
1096
  EnterpriseSearchPolicy.__name__,
984
1097
  )
1098
+
1099
+ @classmethod
1100
+ def get_system_default_prompt_based_on_config(cls, config: Dict[str, Any]) -> str:
1101
+ """
1102
+ Resolves the default prompt template for Enterprise Search Policy based on
1103
+ the component's configuration.
1104
+
1105
+ - The old prompt is selected when both citation and relevancy check are either
1106
+ disabled or not set in the configuration.
1107
+ - The citation prompt is used when citation is enabled and relevancy check is
1108
+ either disabled or not set in the configuration.
1109
+ - The relevancy check prompt is only used when relevancy check is enabled.
1110
+
1111
+ Args:
1112
+ config: The component's configuration.
1113
+
1114
+ Returns:
1115
+ The resolved jinja prompt template as a string.
1116
+ """
1117
+
1118
+ # Get the feature flags
1119
+ citation_enabled = config.get(
1120
+ CITATION_ENABLED_PROPERTY, DEFAULT_CITATION_ENABLED_PROPERTY
1121
+ )
1122
+ relevancy_check_enabled = config.get(
1123
+ CHECK_RELEVANCY_PROPERTY, DEFAULT_CHECK_RELEVANCY_PROPERTY
1124
+ )
1125
+
1126
+ # Based on the enabled features (citation, relevancy check) fetch the
1127
+ # appropriate default prompt
1128
+ default_prompt = cls._select_default_prompt_template_based_on_features(
1129
+ relevancy_check_enabled, citation_enabled
1130
+ )
1131
+
1132
+ return default_prompt
1133
+
1134
+ @classmethod
1135
+ def _resolve_prompt_template(
1136
+ cls,
1137
+ config: dict,
1138
+ log_source_method: Literal["init", "fingerprint"],
1139
+ ) -> str:
1140
+ """
1141
+ Resolves the prompt template to use for the Enterprise Search Policy's
1142
+ generative search.
1143
+
1144
+ Checks if a custom template is provided via component's configuration. If not,
1145
+ it selects the appropriate default template based on the enabled features
1146
+ (citation and relevancy check).
1147
+
1148
+ Args:
1149
+ config: The component's configuration.
1150
+ log_source_method: The name of the method or function emitting the log for
1151
+ better traceability.
1152
+ Returns:
1153
+ The resolved jinja prompt template as a string.
1154
+ """
1155
+
1156
+ # Read the template path from the configuration if available.
1157
+ # The deprecated 'prompt' has a lower priority compared to 'prompt_template'
1158
+ config_defined_prompt = (
1159
+ config.get(PROMPT_TEMPLATE_CONFIG_KEY)
1160
+ or config.get(PROMPT_CONFIG_KEY)
1161
+ or None
1162
+ )
1163
+ # Select the default prompt based on the features set in the config.
1164
+ default_prompt = cls.get_system_default_prompt_based_on_config(config)
1165
+
1166
+ return get_prompt_template(
1167
+ config_defined_prompt,
1168
+ default_prompt,
1169
+ log_source_component=EnterpriseSearchPolicy.__name__,
1170
+ log_source_method=log_source_method,
1171
+ )
1172
+
1173
+ @classmethod
1174
+ def _select_default_prompt_template_based_on_features(
1175
+ cls,
1176
+ relevancy_check_enabled: bool,
1177
+ citation_enabled: bool,
1178
+ ) -> str:
1179
+ """
1180
+ Returns the appropriate default prompt template based on the feature flags.
1181
+
1182
+ The selection follows this priority:
1183
+ 1. If relevancy check is enabled, return the prompt that includes both relevancy
1184
+ and citation blocks.
1185
+ 2. If only citation is enabled, return the prompt with citation blocks.
1186
+ 3. Otherwise, fall back to the legacy default prompt template.
1187
+
1188
+ Args:
1189
+ relevancy_check_enabled: Whether the LLM-generated answer should undergo
1190
+ relevancy evaluation.
1191
+ citation_enabled: Whether citations should be included in the generated
1192
+ answer.
1193
+
1194
+ Returns:
1195
+ The default prompt template corresponding to the enabled features.
1196
+ """
1197
+ if relevancy_check_enabled:
1198
+ # ES prompt that has relevancy check and citations blocks
1199
+ return DEFAULT_ENTERPRISE_SEARCH_PROMPT_WITH_RELEVANCY_CHECK_AND_CITATION_TEMPLATE # noqa: E501
1200
+ elif citation_enabled:
1201
+ # ES prompt with citation's block - backward compatibility
1202
+ return DEFAULT_ENTERPRISE_SEARCH_PROMPT_WITH_CITATION_TEMPLATE
1203
+ else:
1204
+ # Legacy ES prompt - backward compatibility
1205
+ return DEFAULT_ENTERPRISE_SEARCH_PROMPT_TEMPLATE