PyPI - rasa-pro - Versions diffs - 3.8.18__py3-none-any.whl → 3.9.15__py3-none-any.whl - Mend

rasa-pro 3.8.18__py3-none-any.whl → 3.9.15__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of rasa-pro might be problematic. Click here for more details.

Files changed (278) hide show

README.md +6 -42
rasa/__main__.py +14 -9
rasa/anonymization/anonymization_pipeline.py +0 -1
rasa/anonymization/anonymization_rule_executor.py +3 -3
rasa/anonymization/utils.py +4 -3
rasa/api.py +2 -2
rasa/cli/arguments/default_arguments.py +1 -1
rasa/cli/arguments/run.py +2 -2
rasa/cli/arguments/test.py +1 -1
rasa/cli/arguments/train.py +10 -10
rasa/cli/e2e_test.py +27 -7
rasa/cli/export.py +0 -1
rasa/cli/license.py +3 -3
rasa/cli/project_templates/calm/actions/action_template.py +1 -1
rasa/cli/project_templates/calm/config.yml +1 -1
rasa/cli/project_templates/calm/credentials.yml +1 -1
rasa/cli/project_templates/calm/data/flows/add_contact.yml +1 -1
rasa/cli/project_templates/calm/data/flows/remove_contact.yml +1 -1
rasa/cli/project_templates/calm/domain/add_contact.yml +8 -2
rasa/cli/project_templates/calm/domain/list_contacts.yml +3 -0
rasa/cli/project_templates/calm/domain/remove_contact.yml +9 -2
rasa/cli/project_templates/calm/domain/shared.yml +5 -0
rasa/cli/project_templates/calm/endpoints.yml +4 -4
rasa/cli/project_templates/default/actions/actions.py +1 -1
rasa/cli/project_templates/default/config.yml +5 -5
rasa/cli/project_templates/default/credentials.yml +1 -1
rasa/cli/project_templates/default/endpoints.yml +4 -4
rasa/cli/project_templates/default/tests/test_stories.yml +1 -1
rasa/cli/project_templates/tutorial/config.yml +1 -1
rasa/cli/project_templates/tutorial/credentials.yml +1 -1
rasa/cli/project_templates/tutorial/data/patterns.yml +6 -0
rasa/cli/project_templates/tutorial/domain.yml +4 -0
rasa/cli/project_templates/tutorial/endpoints.yml +6 -6
rasa/cli/run.py +0 -1
rasa/cli/scaffold.py +3 -2
rasa/cli/studio/download.py +11 -0
rasa/cli/studio/studio.py +180 -24
rasa/cli/studio/upload.py +0 -8
rasa/cli/telemetry.py +18 -6
rasa/cli/utils.py +21 -10
rasa/cli/x.py +3 -2
rasa/constants.py +1 -1
rasa/core/actions/action.py +90 -315
rasa/core/actions/action_exceptions.py +24 -0
rasa/core/actions/constants.py +3 -0
rasa/core/actions/custom_action_executor.py +188 -0
rasa/core/actions/forms.py +11 -7
rasa/core/actions/grpc_custom_action_executor.py +251 -0
rasa/core/actions/http_custom_action_executor.py +140 -0
rasa/core/actions/loops.py +3 -0
rasa/core/actions/two_stage_fallback.py +1 -1
rasa/core/agent.py +2 -4
rasa/core/brokers/pika.py +1 -2
rasa/core/channels/audiocodes.py +1 -1
rasa/core/channels/botframework.py +0 -1
rasa/core/channels/callback.py +0 -1
rasa/core/channels/console.py +6 -8
rasa/core/channels/development_inspector.py +1 -1
rasa/core/channels/facebook.py +0 -3
rasa/core/channels/hangouts.py +0 -6
rasa/core/channels/inspector/dist/assets/{arc-5623b6dc.js → arc-b6e548fe.js} +1 -1
rasa/core/channels/inspector/dist/assets/{c4Diagram-d0fbc5ce-685c106a.js → c4Diagram-d0fbc5ce-fa03ac9e.js} +1 -1
rasa/core/channels/inspector/dist/assets/{classDiagram-936ed81e-8cbed007.js → classDiagram-936ed81e-ee67392a.js} +1 -1
rasa/core/channels/inspector/dist/assets/{classDiagram-v2-c3cb15f1-5889cf12.js → classDiagram-v2-c3cb15f1-9b283fae.js} +1 -1
rasa/core/channels/inspector/dist/assets/{createText-62fc7601-24c249d7.js → createText-62fc7601-8b6fcc2a.js} +1 -1
rasa/core/channels/inspector/dist/assets/{edges-f2ad444c-7dd06a75.js → edges-f2ad444c-22e77f4f.js} +1 -1
rasa/core/channels/inspector/dist/assets/{erDiagram-9d236eb7-62c1e54c.js → erDiagram-9d236eb7-60ffc87f.js} +1 -1
rasa/core/channels/inspector/dist/assets/{flowDb-1972c806-ce49b86f.js → flowDb-1972c806-9dd802e4.js} +1 -1
rasa/core/channels/inspector/dist/assets/{flowDiagram-7ea5b25a-4067e48f.js → flowDiagram-7ea5b25a-5fa1912f.js} +1 -1
rasa/core/channels/inspector/dist/assets/flowDiagram-v2-855bc5b3-1844e5a5.js +1 -0
rasa/core/channels/inspector/dist/assets/{flowchart-elk-definition-abe16c3d-59fe4051.js → flowchart-elk-definition-abe16c3d-622a1fd2.js} +1 -1
rasa/core/channels/inspector/dist/assets/{ganttDiagram-9b5ea136-47e3a43b.js → ganttDiagram-9b5ea136-e285a63a.js} +1 -1
rasa/core/channels/inspector/dist/assets/{gitGraphDiagram-99d0ae7c-5a2ac0d9.js → gitGraphDiagram-99d0ae7c-f237bdca.js} +1 -1
rasa/core/channels/inspector/dist/assets/{index-2c4b9a3b-dfb8efc4.js → index-2c4b9a3b-4b03d70e.js} +1 -1
rasa/core/channels/inspector/dist/assets/{index-268a75c0.js → index-a5d3e69d.js} +4 -4
rasa/core/channels/inspector/dist/assets/{infoDiagram-736b4530-b0c470f2.js → infoDiagram-736b4530-72a0fa5f.js} +1 -1
rasa/core/channels/inspector/dist/assets/{journeyDiagram-df861f2b-2edb829a.js → journeyDiagram-df861f2b-82218c41.js} +1 -1
rasa/core/channels/inspector/dist/assets/{layout-b6873d69.js → layout-78cff630.js} +1 -1
rasa/core/channels/inspector/dist/assets/{line-1efc5781.js → line-5038b469.js} +1 -1
rasa/core/channels/inspector/dist/assets/{linear-661e9b94.js → linear-c4fc4098.js} +1 -1
rasa/core/channels/inspector/dist/assets/{mindmap-definition-beec6740-2d2e727f.js → mindmap-definition-beec6740-c33c8ea6.js} +1 -1
rasa/core/channels/inspector/dist/assets/{pieDiagram-dbbf0591-9d3ea93d.js → pieDiagram-dbbf0591-a8d03059.js} +1 -1
rasa/core/channels/inspector/dist/assets/{quadrantDiagram-4d7f4fd6-06a178a2.js → quadrantDiagram-4d7f4fd6-6a0e56b2.js} +1 -1
rasa/core/channels/inspector/dist/assets/{requirementDiagram-6fc4c22a-0bfedffc.js → requirementDiagram-6fc4c22a-2dc7c7bd.js} +1 -1
rasa/core/channels/inspector/dist/assets/{sankeyDiagram-8f13d901-d76d0a04.js → sankeyDiagram-8f13d901-2360fe39.js} +1 -1
rasa/core/channels/inspector/dist/assets/{sequenceDiagram-b655622a-37bb4341.js → sequenceDiagram-b655622a-41b9f9ad.js} +1 -1
rasa/core/channels/inspector/dist/assets/{stateDiagram-59f0c015-f52f7f57.js → stateDiagram-59f0c015-0aad326f.js} +1 -1
rasa/core/channels/inspector/dist/assets/{stateDiagram-v2-2b26beab-4a986a20.js → stateDiagram-v2-2b26beab-9847d984.js} +1 -1
rasa/core/channels/inspector/dist/assets/{styles-080da4f6-7dd9ae12.js → styles-080da4f6-564d890e.js} +1 -1
rasa/core/channels/inspector/dist/assets/{styles-3dcbcfbf-46e1ca14.js → styles-3dcbcfbf-38957613.js} +1 -1
rasa/core/channels/inspector/dist/assets/{styles-9c745c82-4a97439a.js → styles-9c745c82-f0fc6921.js} +1 -1
rasa/core/channels/inspector/dist/assets/{svgDrawCommon-4835440b-823917a3.js → svgDrawCommon-4835440b-ef3c5a77.js} +1 -1
rasa/core/channels/inspector/dist/assets/{timeline-definition-5b62e21b-9ea72896.js → timeline-definition-5b62e21b-bf3e91c1.js} +1 -1
rasa/core/channels/inspector/dist/assets/{xychartDiagram-2b33534f-b631a8b6.js → xychartDiagram-2b33534f-4d4026c0.js} +1 -1
rasa/core/channels/inspector/dist/index.html +1 -1
rasa/core/channels/inspector/src/components/DiagramFlow.tsx +10 -0
rasa/core/channels/inspector/src/helpers/formatters.test.ts +4 -7
rasa/core/channels/inspector/src/helpers/formatters.ts +3 -2
rasa/core/channels/rest.py +36 -21
rasa/core/channels/rocketchat.py +0 -1
rasa/core/channels/socketio.py +1 -1
rasa/core/channels/telegram.py +3 -3
rasa/core/channels/webexteams.py +0 -1
rasa/core/concurrent_lock_store.py +1 -1
rasa/core/evaluation/marker_base.py +1 -3
rasa/core/evaluation/marker_stats.py +1 -2
rasa/core/featurizers/single_state_featurizer.py +3 -26
rasa/core/featurizers/tracker_featurizers.py +18 -122
rasa/core/information_retrieval/__init__.py +7 -0
rasa/core/information_retrieval/faiss.py +9 -4
rasa/core/information_retrieval/information_retrieval.py +64 -7
rasa/core/information_retrieval/milvus.py +7 -14
rasa/core/information_retrieval/qdrant.py +8 -15
rasa/core/lock_store.py +0 -1
rasa/core/migrate.py +1 -2
rasa/core/nlg/callback.py +3 -4
rasa/core/policies/enterprise_search_policy.py +86 -22
rasa/core/policies/enterprise_search_prompt_template.jinja2 +4 -41
rasa/core/policies/enterprise_search_prompt_with_citation_template.jinja2 +60 -0
rasa/core/policies/flows/flow_executor.py +104 -2
rasa/core/policies/intentless_policy.py +7 -9
rasa/core/policies/memoization.py +3 -3
rasa/core/policies/policy.py +18 -9
rasa/core/policies/rule_policy.py +8 -11
rasa/core/policies/ted_policy.py +61 -88
rasa/core/policies/unexpected_intent_policy.py +8 -17
rasa/core/processor.py +136 -47
rasa/core/run.py +41 -25
rasa/core/secrets_manager/endpoints.py +2 -2
rasa/core/secrets_manager/vault.py +6 -8
rasa/core/test.py +3 -5
rasa/core/tracker_store.py +49 -14
rasa/core/train.py +1 -3
rasa/core/training/interactive.py +9 -6
rasa/core/utils.py +5 -10
rasa/dialogue_understanding/coexistence/intent_based_router.py +11 -4
rasa/dialogue_understanding/coexistence/llm_based_router.py +2 -3
rasa/dialogue_understanding/commands/__init__.py +4 -0
rasa/dialogue_understanding/commands/can_not_handle_command.py +9 -0
rasa/dialogue_understanding/commands/cancel_flow_command.py +9 -0
rasa/dialogue_understanding/commands/change_flow_command.py +38 -0
rasa/dialogue_understanding/commands/chit_chat_answer_command.py +9 -0
rasa/dialogue_understanding/commands/clarify_command.py +9 -0
rasa/dialogue_understanding/commands/correct_slots_command.py +9 -0
rasa/dialogue_understanding/commands/error_command.py +12 -0
rasa/dialogue_understanding/commands/handle_code_change_command.py +9 -0
rasa/dialogue_understanding/commands/human_handoff_command.py +9 -0
rasa/dialogue_understanding/commands/knowledge_answer_command.py +9 -0
rasa/dialogue_understanding/commands/noop_command.py +9 -0
rasa/dialogue_understanding/commands/set_slot_command.py +38 -3
rasa/dialogue_understanding/commands/skip_question_command.py +9 -0
rasa/dialogue_understanding/commands/start_flow_command.py +9 -0
rasa/dialogue_understanding/generator/__init__.py +16 -1
rasa/dialogue_understanding/generator/command_generator.py +92 -6
rasa/dialogue_understanding/generator/constants.py +18 -0
rasa/dialogue_understanding/generator/flow_retrieval.py +7 -5
rasa/dialogue_understanding/generator/llm_based_command_generator.py +467 -0
rasa/dialogue_understanding/generator/llm_command_generator.py +39 -609
rasa/dialogue_understanding/generator/multi_step/__init__.py +0 -0
rasa/dialogue_understanding/generator/multi_step/fill_slots_prompt.jinja2 +62 -0
rasa/dialogue_understanding/generator/multi_step/handle_flows_prompt.jinja2 +38 -0
rasa/dialogue_understanding/generator/multi_step/multi_step_llm_command_generator.py +827 -0
rasa/dialogue_understanding/generator/nlu_command_adapter.py +69 -8
rasa/dialogue_understanding/generator/single_step/__init__.py +0 -0
rasa/dialogue_understanding/generator/single_step/single_step_llm_command_generator.py +345 -0
rasa/dialogue_understanding/patterns/default_flows_for_patterns.yml +36 -31
rasa/dialogue_understanding/processor/command_processor.py +112 -3
rasa/e2e_test/constants.py +1 -0
rasa/e2e_test/e2e_test_case.py +44 -0
rasa/e2e_test/e2e_test_runner.py +114 -11
rasa/e2e_test/e2e_test_schema.yml +18 -0
rasa/engine/caching.py +0 -1
rasa/engine/graph.py +18 -6
rasa/engine/recipes/config_files/default_config.yml +3 -3
rasa/engine/recipes/default_components.py +1 -1
rasa/engine/recipes/default_recipe.py +4 -5
rasa/engine/recipes/recipe.py +1 -1
rasa/engine/runner/dask.py +3 -9
rasa/engine/storage/local_model_storage.py +0 -2
rasa/engine/validation.py +179 -145
rasa/exceptions.py +2 -2
rasa/graph_components/validators/default_recipe_validator.py +3 -5
rasa/hooks.py +0 -1
rasa/model.py +1 -1
rasa/model_training.py +1 -0
rasa/nlu/classifiers/diet_classifier.py +33 -52
rasa/nlu/classifiers/logistic_regression_classifier.py +9 -22
rasa/nlu/classifiers/sklearn_intent_classifier.py +16 -37
rasa/nlu/extractors/crf_entity_extractor.py +54 -97
rasa/nlu/extractors/duckling_entity_extractor.py +1 -1
rasa/nlu/featurizers/dense_featurizer/convert_featurizer.py +1 -5
rasa/nlu/featurizers/dense_featurizer/lm_featurizer.py +0 -4
rasa/nlu/featurizers/featurizer.py +1 -1
rasa/nlu/featurizers/sparse_featurizer/count_vectors_featurizer.py +18 -49
rasa/nlu/featurizers/sparse_featurizer/lexical_syntactic_featurizer.py +26 -64
rasa/nlu/featurizers/sparse_featurizer/regex_featurizer.py +3 -5
rasa/nlu/persistor.py +68 -26
rasa/nlu/selectors/response_selector.py +7 -10
rasa/nlu/test.py +0 -3
rasa/nlu/utils/hugging_face/registry.py +1 -1
rasa/nlu/utils/spacy_utils.py +1 -3
rasa/server.py +22 -7
rasa/shared/constants.py +12 -1
rasa/shared/core/command_payload_reader.py +109 -0
rasa/shared/core/constants.py +4 -5
rasa/shared/core/domain.py +57 -56
rasa/shared/core/events.py +4 -7
rasa/shared/core/flows/flow.py +9 -0
rasa/shared/core/flows/flows_list.py +12 -0
rasa/shared/core/flows/steps/action.py +7 -2
rasa/shared/core/generator.py +12 -11
rasa/shared/core/slot_mappings.py +315 -24
rasa/shared/core/slots.py +4 -2
rasa/shared/core/trackers.py +32 -14
rasa/shared/core/training_data/loading.py +0 -1
rasa/shared/core/training_data/story_reader/story_reader.py +3 -3
rasa/shared/core/training_data/story_reader/yaml_story_reader.py +11 -11
rasa/shared/core/training_data/story_writer/yaml_story_writer.py +5 -3
rasa/shared/core/training_data/structures.py +1 -1
rasa/shared/core/training_data/visualization.py +1 -1
rasa/shared/data.py +58 -1
rasa/shared/exceptions.py +36 -2
rasa/shared/importers/importer.py +1 -2
rasa/shared/importers/rasa.py +0 -1
rasa/shared/nlu/constants.py +2 -0
rasa/shared/nlu/training_data/entities_parser.py +1 -2
rasa/shared/nlu/training_data/features.py +2 -120
rasa/shared/nlu/training_data/formats/dialogflow.py +3 -2
rasa/shared/nlu/training_data/formats/rasa_yaml.py +3 -5
rasa/shared/nlu/training_data/formats/readerwriter.py +0 -1
rasa/shared/nlu/training_data/message.py +13 -0
rasa/shared/nlu/training_data/training_data.py +0 -2
rasa/shared/providers/openai/session_handler.py +2 -2
rasa/shared/utils/constants.py +3 -0
rasa/shared/utils/io.py +11 -1
rasa/shared/utils/llm.py +1 -2
rasa/shared/utils/pykwalify_extensions.py +1 -0
rasa/shared/utils/schemas/domain.yml +3 -0
rasa/shared/utils/yaml.py +44 -35
rasa/studio/auth.py +26 -10
rasa/studio/constants.py +2 -0
rasa/studio/data_handler.py +114 -107
rasa/studio/download.py +160 -27
rasa/studio/results_logger.py +137 -0
rasa/studio/train.py +6 -7
rasa/studio/upload.py +159 -134
rasa/telemetry.py +188 -34
rasa/tracing/config.py +18 -3
rasa/tracing/constants.py +26 -2
rasa/tracing/instrumentation/attribute_extractors.py +50 -41
rasa/tracing/instrumentation/instrumentation.py +290 -44
rasa/tracing/instrumentation/intentless_policy_instrumentation.py +7 -5
rasa/tracing/instrumentation/metrics.py +109 -21
rasa/tracing/metric_instrument_provider.py +83 -3
rasa/utils/cli.py +2 -1
rasa/utils/common.py +1 -1
rasa/utils/endpoints.py +1 -2
rasa/utils/io.py +72 -6
rasa/utils/licensing.py +246 -31
rasa/utils/ml_utils.py +1 -1
rasa/utils/tensorflow/data_generator.py +1 -1
rasa/utils/tensorflow/environment.py +1 -1
rasa/utils/tensorflow/model_data.py +201 -12
rasa/utils/tensorflow/model_data_utils.py +499 -500
rasa/utils/tensorflow/models.py +5 -6
rasa/utils/tensorflow/rasa_layers.py +15 -15
rasa/utils/train_utils.py +1 -1
rasa/utils/url_tools.py +53 -0
rasa/validator.py +305 -3
rasa/version.py +1 -1
{rasa_pro-3.8.18.dist-info → rasa_pro-3.9.15.dist-info}/METADATA +25 -61
{rasa_pro-3.8.18.dist-info → rasa_pro-3.9.15.dist-info}/RECORD +276 -259
rasa/core/channels/inspector/dist/assets/flowDiagram-v2-855bc5b3-85583a23.js +0 -1
rasa/utils/tensorflow/feature_array.py +0 -370
/rasa/dialogue_understanding/generator/{command_prompt_template.jinja2 → single_step/command_prompt_template.jinja2} +0 -0
{rasa_pro-3.8.18.dist-info → rasa_pro-3.9.15.dist-info}/NOTICE +0 -0
{rasa_pro-3.8.18.dist-info → rasa_pro-3.9.15.dist-info}/WHEEL +0 -0
{rasa_pro-3.8.18.dist-info → rasa_pro-3.9.15.dist-info}/entry_points.txt +0 -0

rasa/nlu/extractors/duckling_entity_extractor.py CHANGED Viewed

@@ -34,7 +34,7 @@ def extract_value(match: Dict[Text, Any]) -> Dict[Text, Any]:
 def convert_duckling_format_to_rasa(
-    matches: List[Dict[Text, Any]]
+    matches: List[Dict[Text, Any]],
 ) -> List[Dict[Text, Any]]:
     extracted = []

rasa/nlu/featurizers/dense_featurizer/convert_featurizer.py CHANGED Viewed

@@ -189,7 +189,7 @@ class ConveRTFeaturizer(DenseFeaturizer, GraphComponent):
                 f"Parameter 'model_url' of "
                 f"'{ConveRTFeaturizer.__name__}' was "
                 f"set to '{model_url}' which is strictly reserved for pytests of "
-                f"Rasa Open Source only. Due to licensing issues you are "
+                f"Rasa Pro only. Due to licensing issues you are "
                 f"not allowed to use the model from this URL. "
                 f"You can either use a community hosted URL or if you have a "
                 f"local copy of the model, pass the path to the directory "
@@ -323,13 +323,11 @@ class ConveRTFeaturizer(DenseFeaturizer, GraphComponent):
         return texts
     def _sentence_encoding_of_text(self, batch: List[Text]) -> np.ndarray:
         return self.sentence_encoding_signature(tf.convert_to_tensor(batch))[
             "default"
         ].numpy()
     def _sequence_encoding_of_text(self, batch: List[Text]) -> np.ndarray:
         return self.sequence_encoding_signature(tf.convert_to_tensor(batch))[
             "sequence_encoding"
         ].numpy()
@@ -346,7 +344,6 @@ class ConveRTFeaturizer(DenseFeaturizer, GraphComponent):
         batch_size = 64
         for attribute in DENSE_FEATURIZABLE_ATTRIBUTES:
             non_empty_examples = list(
                 filter(lambda x: x.get(attribute), training_data.training_examples)
             )
@@ -410,7 +407,6 @@ class ConveRTFeaturizer(DenseFeaturizer, GraphComponent):
             )
     def _tokenize(self, sentence: Text) -> Any:
         return self.tokenize_signature(tf.convert_to_tensor([sentence]))[
             "default"
         ].numpy()

rasa/nlu/featurizers/dense_featurizer/lm_featurizer.py CHANGED Viewed

@@ -316,7 +316,6 @@ class LanguageModelFeaturizer(DenseFeaturizer, GraphComponent):
         batch_token_ids = []
         batch_tokens = []
         for example in batch_examples:
             example_tokens, example_token_ids = self._tokenize_example(
                 example, attribute
             )
@@ -416,7 +415,6 @@ class LanguageModelFeaturizer(DenseFeaturizer, GraphComponent):
         # This doesn't affect the computation since we compute an attention mask
         # anyways.
         for example_token_ids in batch_token_ids:
             # Truncate any longer sequences so that they can be fed to the model
             if len(example_token_ids) > max_sequence_length_model:
                 example_token_ids = example_token_ids[:max_sequence_length_model]
@@ -710,7 +708,6 @@ class LanguageModelFeaturizer(DenseFeaturizer, GraphComponent):
         batch_size = 64
         for attribute in DENSE_FEATURIZABLE_ATTRIBUTES:
             non_empty_examples = list(
                 filter(lambda x: x.get(attribute), training_data.training_examples)
             )
@@ -718,7 +715,6 @@ class LanguageModelFeaturizer(DenseFeaturizer, GraphComponent):
             batch_start_index = 0
             while batch_start_index < len(non_empty_examples):
                 batch_end_index = min(
                     batch_start_index + batch_size, len(non_empty_examples)
                 )

rasa/nlu/featurizers/featurizer.py CHANGED Viewed

@@ -64,7 +64,7 @@ class Featurizer(Generic[FeatureType], ABC):
     @staticmethod
     def raise_if_featurizer_configs_are_not_compatible(
-        featurizer_configs: Iterable[Dict[Text, Any]]
+        featurizer_configs: Iterable[Dict[Text, Any]],
     ) -> None:
         """Validates that the given configurations of featurizers can be used together.

rasa/nlu/featurizers/sparse_featurizer/count_vectors_featurizer.py CHANGED Viewed

@@ -1,32 +1,30 @@
 from __future__ import annotations
 import logging
 import re
-from typing import Any, Dict, List, Optional, Text, Tuple, Set, Type, Union
-import numpy as np
 import scipy.sparse
-from sklearn.exceptions import NotFittedError
-from sklearn.feature_extraction.text import CountVectorizer
+from typing import Any, Dict, List, Optional, Text, Tuple, Set, Type
+from rasa.nlu.tokenizers.tokenizer import Tokenizer
 import rasa.shared.utils.io
 from rasa.engine.graph import GraphComponent, ExecutionContext
 from rasa.engine.recipes.default_recipe import DefaultV1Recipe
 from rasa.engine.storage.resource import Resource
 from rasa.engine.storage.storage import ModelStorage
+from rasa.nlu.featurizers.sparse_featurizer.sparse_featurizer import SparseFeaturizer
+from rasa.nlu.utils.spacy_utils import SpacyModel
+from rasa.shared.constants import DOCS_URL_COMPONENTS
+import rasa.utils.io as io_utils
+from sklearn.exceptions import NotFittedError
+from sklearn.feature_extraction.text import CountVectorizer
+from rasa.shared.nlu.training_data.training_data import TrainingData
+from rasa.shared.nlu.training_data.message import Message
+from rasa.shared.exceptions import RasaException, FileIOException
 from rasa.nlu.constants import (
     TOKENS_NAMES,
     MESSAGE_ATTRIBUTES,
     DENSE_FEATURIZABLE_ATTRIBUTES,
 )
-from rasa.nlu.featurizers.sparse_featurizer.sparse_featurizer import SparseFeaturizer
-from rasa.nlu.tokenizers.tokenizer import Tokenizer
-from rasa.nlu.utils.spacy_utils import SpacyModel
-from rasa.shared.constants import DOCS_URL_COMPONENTS
-from rasa.shared.exceptions import RasaException, FileIOException
 from rasa.shared.nlu.constants import TEXT, INTENT, INTENT_RESPONSE_KEY, ACTION_NAME
-from rasa.shared.nlu.training_data.message import Message
-from rasa.shared.nlu.training_data.training_data import TrainingData
 BUFFER_SLOTS_PREFIX = "buf_"
@@ -101,7 +99,6 @@ class CountVectorsFeaturizer(SparseFeaturizer, GraphComponent):
         return ["sklearn"]
     def _load_count_vect_params(self) -> None:
         # Use shared vocabulary between text and all other attributes of Message
         self.use_shared_vocab = self._config["use_shared_vocab"]
@@ -342,7 +339,7 @@ class CountVectorsFeaturizer(SparseFeaturizer, GraphComponent):
     @staticmethod
     def _convert_attribute_tokens_to_texts(
-        attribute_tokens: Dict[Text, List[List[Text]]]
+        attribute_tokens: Dict[Text, List[List[Text]]],
     ) -> Dict[Text, List[Text]]:
         attribute_texts = {}
@@ -661,7 +658,6 @@ class CountVectorsFeaturizer(SparseFeaturizer, GraphComponent):
         for message in messages:
             for attribute in self._attributes:
                 message_tokens = self._get_processed_message_tokens_by_attribute(
                     message, attribute
                 )
@@ -687,36 +683,11 @@ class CountVectorsFeaturizer(SparseFeaturizer, GraphComponent):
     @staticmethod
     def _is_any_model_trained(
-        attribute_vocabularies: Dict[Text, Optional[Dict[Text, int]]]
+        attribute_vocabularies: Dict[Text, Optional[Dict[Text, int]]],
     ) -> bool:
         """Check if any model got trained."""
         return any(value is not None for value in attribute_vocabularies.values())
-    @staticmethod
-    def convert_vocab(
-        vocab: Dict[str, Union[int, Optional[Dict[str, int]]]], to_int: bool
-    ) -> Dict[str, Union[None, int, np.int64, Dict[str, Union[int, np.int64]]]]:
-        """Converts numpy integers in the vocabulary to Python integers."""
-        def convert_value(value: int) -> Union[int, np.int64]:
-            """Helper function to convert a single value based on to_int flag."""
-            return int(value) if to_int else np.int64(value)
-        result_dict: Dict[
-            str, Union[None, int, np.int64, Dict[str, Union[int, np.int64]]]
-        ] = {}
-        for key, sub_dict in vocab.items():
-            if isinstance(sub_dict, int):
-                result_dict[key] = convert_value(sub_dict)
-            elif not sub_dict:
-                result_dict[key] = None
-            else:
-                result_dict[key] = {
-                    sub_key: convert_value(value) for sub_key, value in sub_dict.items()
-                }
-        return result_dict
     def persist(self) -> None:
         """Persist this model into the passed directory.
@@ -730,18 +701,17 @@ class CountVectorsFeaturizer(SparseFeaturizer, GraphComponent):
             attribute_vocabularies = self._collect_vectorizer_vocabularies()
             if self._is_any_model_trained(attribute_vocabularies):
                 # Definitely need to persist some vocabularies
-                featurizer_file = model_dir / "vocabularies.json"
+                featurizer_file = model_dir / "vocabularies.pkl"
                 # Only persist vocabulary from one attribute if `use_shared_vocab`.
                 # Can be loaded and distributed to all attributes.
-                loaded_vocab = (
+                vocab = (
                     attribute_vocabularies[TEXT]
                     if self.use_shared_vocab
                     else attribute_vocabularies
                 )
-                vocab = self.convert_vocab(loaded_vocab, to_int=True)
-                rasa.shared.utils.io.dump_obj_as_json_to_file(featurizer_file, vocab)
+                io_utils.json_pickle(featurizer_file, vocab)
                 # Dump OOV words separately as they might have been modified during
                 # training
@@ -816,9 +786,8 @@ class CountVectorsFeaturizer(SparseFeaturizer, GraphComponent):
         """Loads trained component (see parent class for full docstring)."""
         try:
             with model_storage.read_from(resource) as model_dir:
-                featurizer_file = model_dir / "vocabularies.json"
-                vocabulary = rasa.shared.utils.io.read_json_file(featurizer_file)
-                vocabulary = cls.convert_vocab(vocabulary, to_int=False)
+                featurizer_file = model_dir / "vocabularies.pkl"
+                vocabulary = io_utils.json_unpickle(featurizer_file)
                 share_vocabulary = config["use_shared_vocab"]

rasa/nlu/featurizers/sparse_featurizer/lexical_syntactic_featurizer.py CHANGED Viewed

@@ -1,7 +1,9 @@
 from __future__ import annotations
 import logging
 from collections import OrderedDict
+import scipy.sparse
+import numpy as np
 from typing import (
     Any,
     Dict,
@@ -15,34 +17,30 @@ from typing import (
     Union,
 )
-import numpy as np
-import scipy.sparse
-import rasa.shared.utils.io
-import rasa.utils.io
 from rasa.engine.graph import ExecutionContext, GraphComponent
 from rasa.engine.recipes.default_recipe import DefaultV1Recipe
 from rasa.engine.storage.resource import Resource
 from rasa.engine.storage.storage import ModelStorage
-from rasa.nlu.constants import TOKENS_NAMES
-from rasa.nlu.featurizers.sparse_featurizer.sparse_featurizer import SparseFeaturizer
 from rasa.nlu.tokenizers.spacy_tokenizer import POS_TAG_KEY, SpacyTokenizer
 from rasa.nlu.tokenizers.tokenizer import Token, Tokenizer
+from rasa.nlu.featurizers.sparse_featurizer.sparse_featurizer import SparseFeaturizer
+from rasa.nlu.constants import TOKENS_NAMES
 from rasa.shared.constants import DOCS_URL_COMPONENTS
-from rasa.shared.exceptions import InvalidConfigException
-from rasa.shared.nlu.constants import TEXT
-from rasa.shared.nlu.training_data.message import Message
 from rasa.shared.nlu.training_data.training_data import TrainingData
+from rasa.shared.nlu.training_data.message import Message
+from rasa.shared.nlu.constants import TEXT
+from rasa.shared.exceptions import InvalidConfigException
+import rasa.shared.utils.io
+import rasa.utils.io
 logger = logging.getLogger(__name__)
 END_OF_SENTENCE = "EOS"
 BEGIN_OF_SENTENCE = "BOS"
 FEATURES = "features"
-SEPERATOR = "###"
 @DefaultV1Recipe.register(
     DefaultV1Recipe.ComponentType.MESSAGE_FEATURIZER, is_trainable=True
@@ -74,13 +72,11 @@ class LexicalSyntacticFeaturizer(SparseFeaturizer, GraphComponent):
       of the token at position `t+1`.
     """
-    FILENAME_FEATURE_TO_IDX_DICT = "feature_to_idx_dict.json"
+    FILENAME_FEATURE_TO_IDX_DICT = "feature_to_idx_dict.pkl"
     # NOTE: "suffix5" of the token "is" will be "is". Hence, when combining multiple
     # prefixes, short words will be represented/encoded repeatedly.
-    _FUNCTION_DICT: Dict[
-        Text, Callable[[Token], Union[Text, bool, None]]
-    ] = {  # noqa: RUF012
+    _FUNCTION_DICT: Dict[Text, Callable[[Token], Union[Text, bool, None]]] = {  # noqa: RUF012
         "low": lambda token: token.text.islower(),
         "title": lambda token: token.text.istitle(),
         "prefix5": lambda token: token.text[:5],
@@ -331,7 +327,6 @@ class LexicalSyntacticFeaturizer(SparseFeaturizer, GraphComponent):
         assert len(window_range) == window_size
         for anchor in range(len(tokens)):
             token_features: Dict[Tuple[int, Text], Text] = {}
             for window_position, relative_position in enumerate(window_range):
@@ -343,13 +338,13 @@ class LexicalSyntacticFeaturizer(SparseFeaturizer, GraphComponent):
                 token = tokens[absolute_position]
                 for feature_name in self._feature_config[window_position]:
-                    token_features[
-                        (window_position, feature_name)
-                    ] = self._extract_raw_features_from_token(
-                        token=token,
-                        feature_name=feature_name,
-                        token_position=absolute_position,
-                        num_tokens=len(tokens),
+                    token_features[(window_position, feature_name)] = (
+                        self._extract_raw_features_from_token(
+                            token=token,
+                            feature_name=feature_name,
+                            token_position=absolute_position,
+                            num_tokens=len(tokens),
+                        )
                     )
             sentence_features.append(token_features)
@@ -358,7 +353,7 @@ class LexicalSyntacticFeaturizer(SparseFeaturizer, GraphComponent):
     @staticmethod
     def _build_feature_to_index_map(
-        feature_vocabulary: Dict[Tuple[int, Text], Set[Text]]
+        feature_vocabulary: Dict[Tuple[int, Text], Set[Text]],
     ) -> Dict[Tuple[int, Text], Dict[Text, int]]:
         """Creates a nested dictionary for mapping raw features to indices.
@@ -493,32 +488,6 @@ class LexicalSyntacticFeaturizer(SparseFeaturizer, GraphComponent):
         """Creates a new untrained component (see parent class for full docstring)."""
         return cls(config, model_storage, resource, execution_context)
-    @staticmethod
-    def _restructure_feature_to_idx_dict(
-        loaded_data: Dict[str, Dict[str, int]],
-    ) -> Dict[Tuple[int, str], Dict[str, int]]:
-        """Reconstructs the feature to idx dict.
-        When storing the feature_to_idx_dict to disk, we need to convert the tuple (key)
-        into a string to be able to store it via json. When loading the data
-        we need to reconstruct the tuple from the stored string.
-        Args:
-            loaded_data: The loaded feature to idx dict from file.
-        Returns:
-            The reconstructed feature_to_idx_dict
-        """
-        feature_to_idx_dict = {}
-        for tuple_string, feature_value in loaded_data.items():
-            # Example of tuple_string: "1###low"
-            index, feature_name = tuple_string.split(SEPERATOR)
-            feature_key = (int(index), feature_name)
-            feature_to_idx_dict[feature_key] = feature_value
-        return feature_to_idx_dict
     @classmethod
     def load(
         cls,
@@ -531,13 +500,10 @@ class LexicalSyntacticFeaturizer(SparseFeaturizer, GraphComponent):
         """Loads trained component (see parent class for full docstring)."""
         try:
             with model_storage.read_from(resource) as model_path:
-                loaded_data = rasa.shared.utils.io.read_json_file(
+                feature_to_idx_dict = rasa.utils.io.json_unpickle(
                     model_path / cls.FILENAME_FEATURE_TO_IDX_DICT,
+                    encode_non_string_keys=True,
                 )
-                # convert the key back into tuple
-                feature_to_idx_dict = cls._restructure_feature_to_idx_dict(loaded_data)
                 return cls(
                     config=config,
                     model_storage=model_storage,
@@ -562,13 +528,9 @@ class LexicalSyntacticFeaturizer(SparseFeaturizer, GraphComponent):
         if not self._feature_to_idx_dict:
             return None
-        # as we cannot dump tuples, convert the tuple into a string
-        restructured_feature_dict = {
-            f"{k[0]}{SEPERATOR}{k[1]}": v for k, v in self._feature_to_idx_dict.items()
-        }
         with self._model_storage.write_to(self._resource) as model_path:
-            rasa.shared.utils.io.dump_obj_as_json_to_file(
+            rasa.utils.io.json_pickle(
                 model_path / self.FILENAME_FEATURE_TO_IDX_DICT,
-                restructured_feature_dict,
+                self._feature_to_idx_dict,
+                encode_non_string_keys=True,
             )

rasa/nlu/featurizers/sparse_featurizer/regex_featurizer.py CHANGED Viewed

@@ -1,13 +1,11 @@
 from __future__ import annotations
 import logging
 import re
 from typing import Any, Dict, List, Optional, Text, Tuple, Type
 import numpy as np
 import scipy.sparse
 from rasa.nlu.tokenizers.tokenizer import Tokenizer
 import rasa.shared.utils.io
 import rasa.utils.io
 import rasa.nlu.utils.pattern_utils as pattern_utils
@@ -242,7 +240,7 @@ class RegexFeaturizer(SparseFeaturizer, GraphComponent):
         try:
             with model_storage.read_from(resource) as model_dir:
-                patterns_file_name = model_dir / "patterns.json"
+                patterns_file_name = model_dir / "patterns.pkl"
                 known_patterns = rasa.shared.utils.io.read_json_file(patterns_file_name)
         except (ValueError, FileNotFoundError):
             logger.warning(
@@ -260,7 +258,7 @@ class RegexFeaturizer(SparseFeaturizer, GraphComponent):
     def _persist(self) -> None:
         with self._model_storage.write_to(self._resource) as model_dir:
-            regex_file = model_dir / "patterns.json"
+            regex_file = model_dir / "patterns.pkl"
             rasa.shared.utils.io.dump_obj_as_json_to_file(
                 regex_file, self.known_patterns
             )

rasa/nlu/persistor.py CHANGED Viewed

@@ -1,16 +1,18 @@
 import abc
-import logging
+import structlog
 import os
 import shutil
 from typing import Optional, Text, Tuple, TYPE_CHECKING
+from rasa.shared.exceptions import RasaException
 import rasa.shared.utils.common
 import rasa.utils.common
 if TYPE_CHECKING:
     from azure.storage.blob import ContainerClient
-logger = logging.getLogger(__name__)
+structlogger = structlog.get_logger()
 def get_persistor(name: Text) -> Optional["Persistor"]:
@@ -95,7 +97,6 @@ class Persistor(abc.ABC):
     @staticmethod
     def _tar_name(model_name: Text, include_extension: bool = True) -> Text:
         ext = ".tar.gz" if include_extension else ""
         return f"{model_name}{ext}"
@@ -129,20 +130,36 @@ class AWSPersistor(Persistor):
     def _ensure_bucket_exists(
         self, bucket_name: Text, region_name: Optional[Text] = None
     ) -> None:
-        import boto3
         import botocore
-        if not region_name:
-            region_name = boto3.DEFAULT_SESSION.region_name
-        bucket_config = {"LocationConstraint": region_name}
         # noinspection PyUnresolvedReferences
         try:
-            self.s3.create_bucket(
-                Bucket=bucket_name, CreateBucketConfiguration=bucket_config
-            )
-        except botocore.exceptions.ClientError:
-            pass  # bucket already exists
+            self.s3.meta.client.head_bucket(Bucket=bucket_name)
+        except botocore.exceptions.ClientError as e:
+            error_code = int(e.response["Error"]["Code"])
+            if error_code == 403:
+                log = (
+                    f"Access to the specified bucket '{bucket_name}' is forbidden. "
+                    "Please make sure you have the necessary "
+                    "permission to access the bucket."
+                )
+                structlogger.error(
+                    "aws_persistor.ensure_bucket_exists.bucket_access_forbidden",
+                    bucket_name=bucket_name,
+                    event_info=log,
+                )
+                raise RasaException(log)
+            elif error_code == 404:
+                log = (
+                    f"The specified bucket '{bucket_name}' does not exist. "
+                    "Please make sure to create the bucket first."
+                )
+                structlogger.error(
+                    "aws_persistor.ensure_bucket_exists.bucket_not_found",
+                    bucket_name=bucket_name,
+                    event_info=log,
+                )
+                raise RasaException(log)
     def _persist_tar(self, file_key: Text, tar_path: Text) -> None:
         """Uploads a model persisted in the `target_dir` to s3."""
@@ -180,10 +197,30 @@ class GCSPersistor(Persistor):
         from google.cloud import exceptions
         try:
-            self.storage_client.create_bucket(bucket_name)
-        except exceptions.Conflict:
-            # bucket exists
-            pass
+            self.storage_client.get_bucket(bucket_name)
+        except exceptions.NotFound:
+            log = (
+                f"The specified bucket '{bucket_name}' does not exist. "
+                "Please make sure to create the bucket first."
+            )
+            structlogger.error(
+                "gcp_persistor.ensure_bucket_exists.bucket_not_found",
+                bucket_name=bucket_name,
+                event_info=log,
+            )
+            raise RasaException(log)
+        except exceptions.Forbidden:
+            log = (
+                f"Access to the specified bucket '{bucket_name}' is forbidden. "
+                "Please make sure you have the necessary "
+                "permission to access the bucket. "
+            )
+            structlogger.error(
+                "gcp_persistor.ensure_bucket_exists.bucket_access_forbidden",
+                bucket_name=bucket_name,
+                event_info=log,
+            )
+            raise RasaException(log)
     def _persist_tar(self, file_key: Text, tar_path: Text) -> None:
         """Uploads a model persisted in the `target_dir` to GCS."""
@@ -210,18 +247,23 @@ class AzurePersistor(Persistor):
             account_url=f"https://{azure_account_name}.blob.core.windows.net/",
             credential=azure_account_key,
         )
-        self._ensure_container_exists(azure_container)
         self.container_name = azure_container
+        self._ensure_container_exists()
-    def _ensure_container_exists(self, container_name: Text) -> None:
-        from azure.core.exceptions import ResourceExistsError
-        try:
-            self.blob_service.create_container(container_name)
-        except ResourceExistsError:
-            # no need to create the container, it already exists
+    def _ensure_container_exists(self) -> None:
+        if self._container_client().exists():
             pass
+        else:
+            log = (
+                f"The specified container '{self.container_name}' does not exist."
+                "Please make sure to create the container first."
+            )
+            structlogger.error(
+                "azure_persistor.ensure_container_exists.container_not_found",
+                container_name=self.container_name,
+                event_info=log,
+            )
+            raise RasaException(log)
     def _container_client(self) -> "ContainerClient":
         return self.blob_service.get_container_client(self.container_name)

rasa/nlu/selectors/response_selector.py CHANGED Viewed

@@ -430,9 +430,9 @@ class ResponseSelector(DIETClassifier):
         self, message: Message, prediction_dict: Dict[Text, Any], selector_key: Text
     ) -> None:
         message_selector_properties = message.get(RESPONSE_SELECTOR_PROPERTY_NAME, {})
-        message_selector_properties[
-            RESPONSE_SELECTOR_RETRIEVAL_INTENTS
-        ] = self.all_retrieval_intents
+        message_selector_properties[RESPONSE_SELECTOR_RETRIEVAL_INTENTS] = (
+            self.all_retrieval_intents
+        )
         message_selector_properties[selector_key] = prediction_dict
         message.set(
             RESPONSE_SELECTOR_PROPERTY_NAME,
@@ -505,7 +505,6 @@ class ResponseSelector(DIETClassifier):
             been caught earlier and a warning should have been raised.
         """
         for key, responses in self.responses.items():
             # First check if the predicted label was the key itself
             search_key = util.template_key_to_intent_response_key(key)
             if search_key == label.get("name"):
@@ -626,7 +625,6 @@ class ResponseSelector(DIETClassifier):
         config: Dict[Text, Any],
         finetune_mode: bool = False,
     ) -> "RasaModel":
         predict_data_example = RasaModelData(
             label_key=model_data_example.label_key,
             data={
@@ -723,7 +721,6 @@ class DIET2BOW(DIET):
             logger.debug(f"  {metric} ({name})")
     def _update_label_metrics(self, loss: tf.Tensor, acc: tf.Tensor) -> None:
         self.response_loss.update_state(loss)
         self.response_acc.update_state(acc)
@@ -796,10 +793,10 @@ class DIET2DIET(DIET):
             (self.text_name, self.config),
             (self.label_name, label_config),
         ]:
-            self._tf_layers[
-                f"sequence_layer.{attribute}"
-            ] = rasa_layers.RasaSequenceLayer(
-                attribute, self.data_signature[attribute], config
+            self._tf_layers[f"sequence_layer.{attribute}"] = (
+                rasa_layers.RasaSequenceLayer(
+                    attribute, self.data_signature[attribute], config
+                )
             )
         if self.config[MASKED_LM]:

rasa/nlu/test.py CHANGED Viewed

@@ -886,7 +886,6 @@ def evaluate_entities(
             exclude_label=NO_ENTITY,
         )
         if output_directory:
             _dump_report(output_directory, f"{extractor}_report.json", report)
         if successes:
@@ -1550,7 +1549,6 @@ async def combine_result(
 def _contains_entity_labels(entity_results: List[EntityEvaluationResult]) -> bool:
     for result in entity_results:
         if result.entity_targets or result.entity_predictions:
             return True
@@ -1791,7 +1789,6 @@ async def compare_nlu(
     training_examples_per_run = []
     for run in range(runs):
         logger.info("Beginning comparison run {}/{}".format(run + 1, runs))
         run_path = os.path.join(output, "run_{}".format(run + 1))

rasa/nlu/utils/hugging_face/registry.py CHANGED Viewed

@@ -25,7 +25,7 @@ from transformers import (  # noqa: E402
     RobertaTokenizer,
     CamembertTokenizer,
 )
-from rasa.nlu.utils.hugging_face.transformers_pre_post_processors import (  # noqa: E402, E501
+from rasa.nlu.utils.hugging_face.transformers_pre_post_processors import (  # noqa: E402
     bert_tokens_pre_processor,
     gpt_tokens_pre_processor,
     xlnet_tokens_pre_processor,

rasa-pro 3.8.18__py3-none-any.whl → 3.9.15__py3-none-any.whl

Potentially problematic release.

rasa-pro 3.8.18__py3-none-any.whl → 3.9.15__py3-none-any.whl