PyPI - rasa-pro - Versions diffs - 3.10.6__py3-none-any.whl → 3.10.7.dev1__py3-none-any.whl - Mend

rasa-pro 3.10.6__py3-none-any.whl → 3.10.7.dev1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of rasa-pro might be problematic. Click here for more details.

Files changed (61) hide show

rasa/api.py +8 -2
rasa/cli/arguments/default_arguments.py +23 -2
rasa/cli/arguments/run.py +2 -0
rasa/cli/inspect.py +5 -2
rasa/cli/run.py +7 -0
rasa/cli/train.py +9 -4
rasa/cli/utils.py +3 -3
rasa/core/agent.py +2 -2
rasa/core/brokers/kafka.py +3 -1
rasa/core/brokers/pika.py +3 -1
rasa/core/channels/voice_aware/utils.py +6 -5
rasa/core/nlg/contextual_response_rephraser.py +11 -2
rasa/{nlu → core}/persistor.py +1 -1
rasa/core/policies/enterprise_search_policy.py +11 -2
rasa/core/policies/intentless_policy.py +9 -2
rasa/core/run.py +2 -1
rasa/core/secrets_manager/constants.py +4 -0
rasa/core/secrets_manager/factory.py +8 -0
rasa/core/secrets_manager/vault.py +11 -1
rasa/core/utils.py +30 -19
rasa/dialogue_understanding/coexistence/llm_based_router.py +9 -2
rasa/dialogue_understanding/generator/llm_based_command_generator.py +11 -2
rasa/dialogue_understanding/generator/llm_command_generator.py +1 -1
rasa/e2e_test/e2e_test_runner.py +1 -1
rasa/engine/graph.py +0 -1
rasa/engine/recipes/config_files/default_config.yml +0 -3
rasa/engine/recipes/default_recipe.py +0 -1
rasa/engine/recipes/graph_recipe.py +0 -1
rasa/engine/storage/local_model_storage.py +0 -1
rasa/engine/storage/storage.py +1 -5
rasa/model_manager/__init__.py +0 -0
rasa/model_manager/config.py +7 -0
rasa/model_manager/model_api.py +424 -0
rasa/model_manager/runner_service.py +185 -0
rasa/model_manager/socket_bridge.py +44 -0
rasa/model_manager/trainer_service.py +240 -0
rasa/model_manager/utils.py +27 -0
rasa/model_service.py +43 -0
rasa/model_training.py +11 -6
rasa/server.py +1 -1
rasa/shared/constants.py +2 -0
rasa/shared/core/domain.py +101 -47
rasa/shared/core/flows/flows_list.py +19 -6
rasa/shared/core/flows/validation.py +25 -0
rasa/shared/core/flows/yaml_flows_io.py +3 -24
rasa/shared/importers/importer.py +32 -32
rasa/shared/importers/multi_project.py +23 -11
rasa/shared/importers/rasa.py +7 -2
rasa/shared/importers/remote_importer.py +2 -2
rasa/shared/importers/utils.py +3 -1
rasa/shared/nlu/training_data/training_data.py +18 -19
rasa/shared/utils/common.py +3 -22
rasa/shared/utils/llm.py +28 -2
rasa/shared/utils/schemas/model_config.yml +0 -10
rasa/tracing/instrumentation/attribute_extractors.py +1 -1
rasa/version.py +1 -1
{rasa_pro-3.10.6.dist-info → rasa_pro-3.10.7.dev1.dist-info}/METADATA +2 -2
{rasa_pro-3.10.6.dist-info → rasa_pro-3.10.7.dev1.dist-info}/RECORD +61 -53
{rasa_pro-3.10.6.dist-info → rasa_pro-3.10.7.dev1.dist-info}/NOTICE +0 -0
{rasa_pro-3.10.6.dist-info → rasa_pro-3.10.7.dev1.dist-info}/WHEEL +0 -0
{rasa_pro-3.10.6.dist-info → rasa_pro-3.10.7.dev1.dist-info}/entry_points.txt +0 -0

rasa/model_manager/trainer_service.py ADDED Viewed

@@ -0,0 +1,240 @@
+import os
+from typing import Any, Dict, Optional
+import shutil
+import base64
+import structlog
+import subprocess
+from dataclasses import dataclass
+from rasa.model_manager.config import RASA_PYTHON_PATH, SERVER_BASE_WORKING_DIRECTORY
+from rasa.model_manager.utils import logs_path
+structlogger = structlog.get_logger()
@dataclass
class TrainingSession:
    """Bookkeeping record for a single training run.

    Bundles the identifiers of a run with its lifecycle state and the handle
    of the subprocess that performs the training.
    """

    # identifier of this training run
    training_id: str
    # identifier of the assistant the run belongs to
    assistant_id: str
    # optional identifier of the requesting client
    client_id: Optional[str]
    # progress value; this module sets 0 at start and 100 on completion
    progress: int
    # lifecycle state; this module uses "running", "stopped", "done", "error"
    status: str
    # handle of the training subprocess
    process: subprocess.Popen
def train_path(training_id: str) -> str:
    """Build the absolute path of the working directory of a training.

    Args:
        training_id: identifier of the training run.

    Returns:
        Absolute path of `<base working directory>/trainings/<training_id>`.
    """
    training_directory = f"{SERVER_BASE_WORKING_DIRECTORY}/trainings/{training_id}"
    return os.path.abspath(training_directory)
def cache_for_assistant_path(assistant_id: str) -> str:
    """Build the absolute path of the cache directory of an assistant.

    Args:
        assistant_id: identifier of the assistant.

    Returns:
        Absolute path of `<base working directory>/caches/<assistant_id>`.
    """
    cache_directory = f"{SERVER_BASE_WORKING_DIRECTORY}/caches/{assistant_id}"
    return os.path.abspath(cache_directory)
def write_encoded_data_to_file(encoded_data: bytes, file: str) -> None:
    """Decode base64 encoded text and write it to a file as UTF-8.

    Args:
        encoded_data: base64 encoded payload whose decoded bytes are UTF-8 text.
        file: path of the file to write. Missing parent directories are
            created.

    Raises:
        binascii.Error: if the payload is incorrectly padded base64.
        UnicodeDecodeError: if the decoded payload is not valid UTF-8.
    """
    # Decode before touching the filesystem: opening the file first would
    # truncate an existing file even when the payload turns out to be invalid.
    text = base64.b64decode(encoded_data).decode("utf-8")

    # A bare file name has no directory component and `os.makedirs("")` raises.
    parent_directory = os.path.dirname(file)
    if parent_directory:
        os.makedirs(parent_directory, exist_ok=True)

    # The payload was decoded as UTF-8, so write it back as UTF-8 instead of
    # relying on the platform's default encoding.
    with open(file, "w", encoding="utf-8") as f:
        f.write(text)
def terminate_training(training: TrainingSession) -> None:
    """Request termination of a running training and mark it as stopped.

    Sessions whose status is not "running" are left untouched. If the
    process can no longer be found, the status is not changed.
    """
    if training.status != "running":
        return

    structlogger.info(
        "model_trainer.user_stopping_training", training_id=training.training_id
    )
    try:
        training.process.terminate()
    except ProcessLookupError:
        structlogger.debug(
            "model_trainer.training_process_not_found",
            training_id=training.training_id,
        )
    else:
        training.status = "stopped"
def update_training_status(training: TrainingSession) -> None:
    """Complete a training session once its process has exited.

    Nothing happens for sessions that are not marked "running" or whose
    process is still alive.
    """
    # the process is only polled for sessions that are marked as running
    process_has_exited = (
        training.status == "running" and training.process.poll() is not None
    )
    if process_has_exited:
        complete_training(training)
def complete_training(training: TrainingSession) -> None:
    """Finalize a training session.

    The status becomes "done" when the process return code is 0 and "error"
    otherwise. Progress is set to 100 and the cache of the training
    directory is persisted for the assistant.
    """
    if training.process.returncode == 0:
        training.status = "done"
    else:
        training.status = "error"
    training.progress = 100

    structlogger.info(
        "model_trainer.training_finished",
        training_id=training.training_id,
        status=training.status,
    )

    # keep the cache around so later trainings of this assistant can reuse it
    training_directory = train_path(training.training_id)
    persist_rasa_cache(training.assistant_id, training_directory)
def seed_training_directory_with_rasa_cache(
    training_base_path: str, assistant_id: str
) -> None:
    """Copy the assistant's persisted cache into a training directory.

    The cache is copied to `<training_base_path>/.rasa`. Nothing is copied
    when no cache exists for the assistant.
    """
    previous_cache = cache_for_assistant_path(assistant_id)
    if not os.path.exists(previous_cache):
        # no earlier training left a cache behind for this assistant
        return

    structlogger.debug(
        "model_trainer.populating_training_dir_with_cache",
        assistant_id=assistant_id,
        training_base_path=training_base_path,
    )
    shutil.copytree(previous_cache, f"{training_base_path}/.rasa")
def persist_rasa_cache(assistant_id: str, training_base_path: str) -> None:
    """Persist the cache of a training session to speed up future trainings.

    The cache files live inside `<training_base_path>/.rasa` and are copied
    to the cache directory of the assistant, replacing what was stored there.

    Args:
        assistant_id: identifier of the assistant the cache belongs to.
        training_base_path: working directory of the finished training.
    """
    training_cache_path = f"{training_base_path}/.rasa"

    # A training that produced no `.rasa` directory has nothing to persist.
    # Check before deleting anything: otherwise the previous cache would be
    # wiped and the copy below would raise `FileNotFoundError`.
    if not os.path.isdir(training_cache_path):
        structlogger.debug(
            "model_trainer.no_cache_to_persist",
            assistant_id=assistant_id,
            training_base_path=training_base_path,
        )
        return

    structlogger.debug(
        "model_trainer.persisting_assistant_cache", assistant_id=assistant_id
    )
    cache_path = cache_for_assistant_path(assistant_id)
    # `copytree` requires a non-existing destination, so drop the old cache
    shutil.rmtree(cache_path, ignore_errors=True)
    shutil.copytree(training_cache_path, cache_path)
def write_training_data_to_files(
    encoded_training_data: Dict[str, Any], training_base_path: str
) -> None:
    """Write the base64 encoded training data into the training directory.

    Expected format of the incoming data, every key being optional:
    ```
    {
        "domain": "base64 encoded domain.yml",
        "credentials": "base64 encoded credentials.yml",
        "endpoints": "base64 encoded endpoints.yml",
        "flows": "base64 encoded flows.yml",
        "config": "base64 encoded config.yml",
        "stories": "base64 encoded stories.yml",
        "rules": "base64 encoded rules.yml",
        "nlu": "base64 encoded nlu.yml"
    }
    ```
    A file is written for every key; a missing key is written from an empty
    payload.
    """
    # (key in the request, file relative to the training directory)
    target_files = (
        ("domain", "domain.yml"),
        ("credentials", "credentials.yml"),
        ("endpoints", "endpoints.yml"),
        ("flows", "data/flows.yml"),
        ("config", "config.yml"),
        ("stories", "data/stories.yml"),
        ("rules", "data/rules.yml"),
        ("nlu", "data/nlu.yml"),
    )
    for request_key, relative_file in target_files:
        payload = encoded_training_data.get(request_key, "")
        write_encoded_data_to_file(payload, f"{training_base_path}/{relative_file}")
def prepare_training_directory(
    training_base_path: str, assistant_id: str, data: Dict[str, Any]
) -> None:
    """Set up the working directory of a new training session.

    Creates the directory, seeds it with the assistant's cache and writes
    the training data found under `data["bot_config"]["data"]` into it.
    """
    # the training data of the request is base64 encoded
    bot_config = data.get("bot_config", {})
    encoded_training_data = bot_config.get("data", {})

    os.makedirs(training_base_path, exist_ok=True)
    seed_training_directory_with_rasa_cache(training_base_path, assistant_id)
    write_training_data_to_files(encoded_training_data, training_base_path)
def start_training_process(
    training_id: str, assistant_id: str, client_id: str, training_base_path: str
) -> TrainingSession:
    """Start `rasa train` in a subprocess for a prepared training directory.

    The subprocess runs with the training directory as working directory and
    writes both stdout and stderr to the log file of the training.

    Args:
        training_id: identifier of the training run.
        assistant_id: identifier of the assistant that is trained.
        client_id: identifier of the requesting client.
        training_base_path: prepared working directory of the training.

    Returns:
        A `TrainingSession` in status "running" holding the process handle.
    """
    log_path = logs_path(training_id)

    # run the rasa train command with the configured python interpreter
    command = [
        RASA_PYTHON_PATH,
        "-m",
        "rasa.__main__",
        "train",
        "--debug",
        "--out",
        f"{training_base_path}/models",
        "--data",
        f"{training_base_path}/data",
        "--config",
        f"{training_base_path}/config.yml",
        "--domain",
        f"{training_base_path}/domain.yml",
        "--endpoints",
        f"{training_base_path}/endpoints.yml",
    ]

    # The child process gets its own copy of the log file descriptor, so the
    # parent's handle can be closed as soon as the process has been spawned.
    # Opening the file inline left closing it to the garbage collector.
    with open(log_path, "w") as log_file:
        process = subprocess.Popen(
            command,
            cwd=training_base_path,
            stdout=log_file,
            # pipe stderr to the same file as stdout
            stderr=subprocess.STDOUT,
            env=os.environ.copy(),
        )

    structlogger.info(
        "model_trainer.training_started",
        training_id=training_id,
        assistant_id=assistant_id,
        client_id=client_id,
        log=log_path,
        pid=process.pid,
    )

    return TrainingSession(
        training_id=training_id,
        assistant_id=assistant_id,
        client_id=client_id,
        progress=0,
        status="running",
        process=process,  # Store the process handle
    )
def run_training(
    training_id: str, assistant_id: str, client_id: str, data: Dict
) -> TrainingSession:
    """Prepare the training directory and start the training process.

    Returns:
        The session describing the started training.
    """
    working_directory = train_path(training_id)
    prepare_training_directory(working_directory, assistant_id, data)
    session = start_training_process(
        training_id, assistant_id, client_id, working_directory
    )
    return session

rasa/model_manager/utils.py ADDED Viewed

@@ -0,0 +1,27 @@
+import os
+from rasa.model_manager.config import SERVER_BASE_WORKING_DIRECTORY
def logs_base_path() -> str:
    """Build the absolute path of `<base working directory>/logs`."""
    logs_directory = f"{SERVER_BASE_WORKING_DIRECTORY}/logs"
    return os.path.abspath(logs_directory)
def models_base_path() -> str:
    """Build the absolute path of `<base working directory>/models`."""
    models_directory = f"{SERVER_BASE_WORKING_DIRECTORY}/models"
    return os.path.abspath(models_directory)
def logs_path(action_id: str) -> str:
    """Build the absolute path of the log file of an action.

    Args:
        action_id: can either be a training_id or a deployment_id

    Returns:
        Absolute path of `<logs directory>/<action_id>.txt`.
    """
    log_file = f"{logs_base_path()}/{action_id}.txt"
    return os.path.abspath(log_file)
def models_path(training_id: str) -> str:
    """Build the absolute path of `<models directory>/<training_id>`.

    Args:
        training_id: identifier of the training run.
    """
    model_directory = f"{models_base_path()}/{training_id}"
    return os.path.abspath(model_directory)

rasa/model_service.py ADDED Viewed

@@ -0,0 +1,43 @@
+import os
+import logging
+import structlog
+from rasa.model_manager import model_api
+from rasa.utils.common import configure_logging_and_warnings
+import rasa.utils.licensing
+structlogger = structlog.get_logger()
+MODEL_SERVICE_PORT = 8000
def main() -> None:
    """Start the Rasa Model Manager server.

    The API server can receive requests to train models, run bots, and manage
    the lifecycle of models and bots.

    Raises:
        AssertionError: if the `OPENAI_API_KEY` environment variable is not set.
    """
    model_api.prepare_working_directories()

    configure_logging_and_warnings(
        log_level=logging.DEBUG,
        logging_config_file=None,
        warn_only_once=True,
        filter_repeated_logs=True,
    )

    rasa.utils.licensing.validate_license_from_env()

    # Check explicitly instead of using `assert`: assert statements are
    # removed when Python runs with `-O`, which would skip this validation.
    # The exception type is kept so the failure looks the same as before.
    if "OPENAI_API_KEY" not in os.environ:
        raise AssertionError("Please set the OPENAI_API_KEY environment variable")

    structlogger.debug("model_training.starting_server", port=MODEL_SERVICE_PORT)
    structlogger.debug("model_running.starting_server", port=MODEL_SERVICE_PORT)

    model_api.app.run(host="0.0.0.0", port=MODEL_SERVICE_PORT, legacy=True)
+if __name__ == "__main__":
+    main()

rasa/model_training.py CHANGED Viewed

@@ -15,6 +15,7 @@ import rasa.shared.utils.common
 import rasa.shared.utils.io
 import rasa.utils.common
 from rasa import telemetry
+from rasa.core.persistor import StorageType
 from rasa.engine.caching import LocalTrainingCache
 from rasa.engine.recipes.recipe import Recipe
 from rasa.engine.runner.dask import DaskGraphRunner
@@ -22,7 +23,6 @@ from rasa.engine.storage.local_model_storage import LocalModelStorage
 from rasa.engine.storage.storage import ModelStorage
 from rasa.engine.training.components import FingerprintStatus
 from rasa.engine.training.graph_trainer import GraphTrainer
-from rasa.nlu.persistor import StorageType
 from rasa.shared.core.domain import Domain
 from rasa.shared.core.events import SlotSet
 from rasa.shared.core.training_data.structures import StoryGraph
@@ -156,6 +156,7 @@ async def train(
     model_to_finetune: Optional[Text] = None,
     finetuning_epoch_fraction: float = 1.0,
     remote_storage: Optional[StorageType] = None,
+    file_importer: Optional[TrainingDataImporter] = None,
 ) -> TrainingResult:
     """Trains a Rasa model (Core and NLU).
@@ -177,14 +178,18 @@ async def train(
             a directory in case the latest trained model should be used.
         finetuning_epoch_fraction: The fraction currently specified training epochs
             in the model configuration which should be used for finetuning.
-        remote_storage: The remote storage which should be used to store the model.
+        remote_storage: Optional name of the remote storage to
+            use for storing the model.
+        file_importer: Instance of `TrainingDataImporter` to use for training.
+            If it is not provided, a new instance will be created.
     Returns:
         An instance of `TrainingResult`.
     """
-    file_importer = TrainingDataImporter.load_from_config(
-        config, domain, training_files, core_additional_arguments
-    )
+    if not file_importer:
+        file_importer = TrainingDataImporter.load_from_config(
+            config, domain, training_files, core_additional_arguments
+        )
     stories = file_importer.get_stories()
     flows = file_importer.get_flows()
@@ -555,7 +560,7 @@ async def train_nlu(
 def push_model_to_remote_storage(model_path: Path, remote_storage: StorageType) -> None:
     """push model to remote storage"""
-    from rasa.nlu.persistor import get_persistor
+    from rasa.core.persistor import get_persistor
     persistor = get_persistor(remote_storage)

rasa/server.py CHANGED Viewed

@@ -50,11 +50,11 @@ from rasa.core.channels.channel import (
     UserMessage,
 )
 from rasa.core.constants import DEFAULT_RESPONSE_TIMEOUT
+from rasa.core.persistor import parse_remote_storage
 from rasa.core.test import test
 from rasa.core.utils import AvailableEndpoints
 from rasa.nlu.emulators.emulator import Emulator
 from rasa.nlu.emulators.no_emulator import NoEmulator
-from rasa.nlu.persistor import parse_remote_storage
 from rasa.nlu.test import CVEvaluationResult
 from rasa.shared.constants import (
     DEFAULT_MODELS_PATH,

rasa/shared/constants.py CHANGED Viewed

@@ -183,6 +183,8 @@ STREAM_CONFIG_KEY = "stream"
 N_REPHRASES_CONFIG_KEY = "n"
 USE_CHAT_COMPLETIONS_ENDPOINT_CONFIG_KEY = "use_chat_completions_endpoint"
+LLM_API_HEALTH_CHECK_ENV_VAR = "LLM_API_HEALTH_CHECK"
 AZURE_API_KEY_ENV_VAR = "AZURE_API_KEY"
 AZURE_AD_TOKEN_ENV_VAR = "AZURE_AD_TOKEN"
 AZURE_API_BASE_ENV_VAR = "AZURE_API_BASE"

rasa-pro 3.10.6__py3-none-any.whl → 3.10.7.dev1__py3-none-any.whl

Potentially problematic release.

rasa-pro 3.10.6__py3-none-any.whl → 3.10.7.dev1__py3-none-any.whl