rasa-pro 3.11.0a3__py3-none-any.whl → 3.11.0a4.dev1__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of rasa-pro might be problematic. Click here for more details.
- README.md +17 -396
- rasa/api.py +4 -0
- rasa/cli/arguments/train.py +14 -0
- rasa/cli/inspect.py +1 -1
- rasa/cli/interactive.py +1 -0
- rasa/cli/project_templates/calm/endpoints.yml +7 -2
- rasa/cli/project_templates/tutorial/endpoints.yml +7 -2
- rasa/cli/train.py +3 -0
- rasa/constants.py +2 -0
- rasa/core/actions/action.py +75 -33
- rasa/core/actions/action_repeat_bot_messages.py +72 -0
- rasa/core/actions/e2e_stub_custom_action_executor.py +5 -1
- rasa/core/actions/http_custom_action_executor.py +4 -0
- rasa/core/channels/socketio.py +5 -1
- rasa/core/channels/voice_ready/utils.py +6 -5
- rasa/core/channels/voice_stream/browser_audio.py +1 -1
- rasa/core/channels/voice_stream/twilio_media_streams.py +1 -1
- rasa/core/nlg/contextual_response_rephraser.py +19 -2
- rasa/core/persistor.py +87 -21
- rasa/core/utils.py +53 -22
- rasa/dialogue_understanding/commands/__init__.py +4 -0
- rasa/dialogue_understanding/commands/repeat_bot_messages_command.py +60 -0
- rasa/dialogue_understanding/generator/single_step/command_prompt_template.jinja2 +3 -0
- rasa/dialogue_understanding/generator/single_step/single_step_llm_command_generator.py +19 -0
- rasa/dialogue_understanding/patterns/default_flows_for_patterns.yml +5 -0
- rasa/dialogue_understanding/patterns/repeat.py +37 -0
- rasa/e2e_test/utils/io.py +2 -0
- rasa/model_manager/__init__.py +0 -0
- rasa/model_manager/config.py +18 -0
- rasa/model_manager/model_api.py +469 -0
- rasa/model_manager/runner_service.py +279 -0
- rasa/model_manager/socket_bridge.py +143 -0
- rasa/model_manager/studio_jwt_auth.py +86 -0
- rasa/model_manager/trainer_service.py +332 -0
- rasa/model_manager/utils.py +66 -0
- rasa/model_service.py +109 -0
- rasa/model_training.py +25 -7
- rasa/shared/constants.py +6 -0
- rasa/shared/core/constants.py +2 -0
- rasa/shared/providers/llm/self_hosted_llm_client.py +15 -3
- rasa/shared/utils/yaml.py +10 -1
- rasa/utils/endpoints.py +27 -1
- rasa/version.py +1 -1
- rasa_pro-3.11.0a4.dev1.dist-info/METADATA +197 -0
- {rasa_pro-3.11.0a3.dist-info → rasa_pro-3.11.0a4.dev1.dist-info}/RECORD +48 -38
- rasa/keys +0 -1
- rasa/llm_fine_tuning/notebooks/unsloth_finetuning.ipynb +0 -407
- rasa_pro-3.11.0a3.dist-info/METADATA +0 -576
- {rasa_pro-3.11.0a3.dist-info → rasa_pro-3.11.0a4.dev1.dist-info}/NOTICE +0 -0
- {rasa_pro-3.11.0a3.dist-info → rasa_pro-3.11.0a4.dev1.dist-info}/WHEEL +0 -0
- {rasa_pro-3.11.0a3.dist-info → rasa_pro-3.11.0a4.dev1.dist-info}/entry_points.txt +0 -0
|
@@ -0,0 +1,469 @@
|
|
|
1
|
+
import asyncio
|
|
2
|
+
from functools import wraps
|
|
3
|
+
import os
|
|
4
|
+
from http import HTTPStatus
|
|
5
|
+
from typing import Any, Dict, Optional, Callable
|
|
6
|
+
import dotenv
|
|
7
|
+
from sanic import Blueprint, Sanic, response
|
|
8
|
+
from sanic.response import json
|
|
9
|
+
from sanic.exceptions import NotFound
|
|
10
|
+
from sanic.request import Request
|
|
11
|
+
import structlog
|
|
12
|
+
from socketio import AsyncServer
|
|
13
|
+
|
|
14
|
+
from rasa.exceptions import ModelNotFound
|
|
15
|
+
from rasa.model_manager import config, studio_jwt_auth
|
|
16
|
+
from rasa.model_manager.config import SERVER_BASE_URL
|
|
17
|
+
from rasa.constants import MODEL_ARCHIVE_EXTENSION
|
|
18
|
+
from rasa.model_manager.runner_service import (
|
|
19
|
+
BotSession,
|
|
20
|
+
fetch_remote_model_to_dir,
|
|
21
|
+
run_bot,
|
|
22
|
+
terminate_bot,
|
|
23
|
+
update_bot_status,
|
|
24
|
+
)
|
|
25
|
+
from rasa.model_manager.socket_bridge import create_bridge_server
|
|
26
|
+
from rasa.model_manager.trainer_service import (
|
|
27
|
+
TrainingSession,
|
|
28
|
+
run_training,
|
|
29
|
+
terminate_training,
|
|
30
|
+
update_training_status,
|
|
31
|
+
)
|
|
32
|
+
from rasa.model_manager.utils import (
|
|
33
|
+
get_logs_content,
|
|
34
|
+
logs_base_path,
|
|
35
|
+
models_base_path,
|
|
36
|
+
subpath,
|
|
37
|
+
)
|
|
38
|
+
|
|
39
|
+
# Load environment variables from a local .env file, if one is present.
dotenv.load_dotenv()

structlogger = structlog.get_logger()


# A simple in-memory store for training sessions and running bots
# NOTE(review): state is process-local, so it is lost on restart and not
# shared across workers — presumably this service runs single-process; confirm.
trainings: Dict[str, TrainingSession] = {}
running_bots: Dict[str, BotSession] = {}
|
|
47
|
+
|
|
48
|
+
|
|
49
|
+
def prepare_working_directories() -> None:
    """Ensure the log and model directories exist on disk."""
    for directory in (logs_base_path(), models_base_path()):
        os.makedirs(directory, exist_ok=True)
|
|
53
|
+
|
|
54
|
+
|
|
55
|
+
def cleanup_training_processes() -> None:
    """Terminate every training process currently tracked in `trainings`."""
    structlogger.debug("model_trainer.cleanup_processes.started")
    # Snapshot the sessions so termination may mutate the registry safely.
    for session in list(trainings.values()):
        terminate_training(session)
|
|
61
|
+
|
|
62
|
+
|
|
63
|
+
def cleanup_bot_processes() -> None:
    """Terminate every bot process currently tracked in `running_bots`."""
    structlogger.debug("model_runner.cleanup_processes.started")
    # Snapshot the sessions so termination may mutate the registry safely.
    for session in list(running_bots.values()):
        terminate_bot(session)
|
|
69
|
+
|
|
70
|
+
|
|
71
|
+
def update_status_of_all_trainings() -> None:
    """Refresh the status of every tracked training process."""
    # Iterate over a snapshot so status updates may mutate the registry.
    for session in list(trainings.values()):
        update_training_status(session)
|
|
76
|
+
|
|
77
|
+
|
|
78
|
+
async def update_status_of_all_bots() -> None:
    """Refresh the status of every tracked bot process.

    A snapshot of the sessions is taken before iterating: while this
    coroutine is suspended at an ``await``, other tasks on the event loop
    may add or remove bots, and resizing a dict mid-iteration raises a
    ``RuntimeError``.
    """
    snapshot = list(running_bots.values())
    for session in snapshot:
        await update_bot_status(session)
|
|
88
|
+
|
|
89
|
+
|
|
90
|
+
def base_server_url(request: Request) -> str:
    """Return the server's base URL.

    Prefers the configured ``SERVER_BASE_URL`` (trailing slash stripped);
    otherwise the URL is derived from the incoming request.
    """
    if not SERVER_BASE_URL:
        return f"{request.scheme}://{request.host}"
    return SERVER_BASE_URL.rstrip("/")
|
|
96
|
+
|
|
97
|
+
|
|
98
|
+
async def continuously_update_process_status() -> None:
    """Regularly update the status of all training and bot processes.

    Polls once per second until the surrounding task is cancelled.
    Unexpected errors are logged and the loop keeps running.
    """
    structlogger.debug("model_api.update_process_status.started")

    while True:
        try:
            update_status_of_all_trainings()
            await update_status_of_all_bots()
        except asyncio.CancelledError:
            # Exit immediately on cancellation. Previously the sleep lived
            # in a ``finally`` block, so it ran even after this ``break``,
            # delaying shutdown by a full poll interval and awaiting inside
            # an already-cancelled task.
            structlogger.debug("model_api.update_process_status.cancelled")
            break
        except Exception as e:
            structlogger.error("model_api.update_process_status.error", error=str(e))
        # Sleep only on the non-cancelled paths (success or logged error).
        await asyncio.sleep(1)
|
|
113
|
+
|
|
114
|
+
|
|
115
|
+
def requires_studio_auth() -> Callable:
    """Decorator factory that guards a request handler with Studio JWT auth.

    The token is read from the ``Authorization: Bearer <token>`` header;
    unauthenticated callers receive a 401 JSON response.
    """

    def decorator(handler: Callable) -> Callable:
        @wraps(handler)
        async def wrapper(
            request: Request, *args: Any, **kwargs: Any
        ) -> response.HTTPResponse:
            auth_header = request.headers.get("Authorization", "")
            token = auth_header.split("Bearer ")[-1]
            try:
                studio_jwt_auth.authenticate_user_to_service(token)
                return await handler(request, *args, **kwargs)
            except studio_jwt_auth.UserToServiceAuthenticationError:
                return response.json({"message": "User not authenticated."}, status=401)

        return wrapper

    return decorator
|
|
134
|
+
|
|
135
|
+
|
|
136
|
+
def internal_blueprint() -> Blueprint:
    """Create the internal (unauthenticated) blueprint for the model manager API.

    Registers lifecycle hooks, request-limiting middleware, and CRUD-style
    routes for training sessions (``/training``) and deployed bots (``/bot``),
    all backed by the module-level ``trainings`` and ``running_bots`` dicts.
    """
    bp = Blueprint("model_api_internal")

    @bp.before_server_stop
    async def cleanup_processes(app: Sanic, loop: asyncio.AbstractEventLoop) -> None:
        """Terminate all running processes before the server stops."""
        structlogger.debug("model_api.cleanup_processes.started")
        cleanup_training_processes()
        cleanup_bot_processes()

    @bp.on_request  # type: ignore[misc]
    async def limit_parallel_training_requests(request: Request) -> Any:
        """Limit the number of parallel training requests.

        Returning a response from an ``on_request`` middleware short-circuits
        the route handler; returning ``None`` lets the request proceed.

        NOTE(review): ``request.url.endswith("/training")`` matches GET list
        requests as well as POST — confirm whether reads should also be
        rejected while at the training limit.
        """
        from rasa.model_manager.config import MAX_PARALLEL_TRAININGS

        if not request.url.endswith("/training"):
            return None

        # A training counts as active only while its subprocess is alive.
        running_requests = len(
            [
                training
                for training in trainings.values()
                if training.status == "running" and training.process.poll() is None
            ]
        )

        if running_requests >= int(MAX_PARALLEL_TRAININGS):
            return response.json(
                {
                    "message": f"Too many parallel training requests, above "
                    f"the limit of {MAX_PARALLEL_TRAININGS}. "
                    f"Retry later or increase your server's "
                    f"memory and CPU resources."
                },
                status=HTTPStatus.TOO_MANY_REQUESTS,
            )

    @bp.on_request  # type: ignore[misc]
    async def limit_parallel_bot_runs(request: Request) -> Any:
        """Limit the number of parallel bot runs.

        NOTE(review): this reuses ``MAX_PARALLEL_TRAININGS`` as the bot
        limit — confirm there is no separate bot-specific setting intended.
        As above, ``endswith("/bot")`` also matches GET list requests.
        """
        from rasa.model_manager.config import MAX_PARALLEL_TRAININGS

        if not request.url.endswith("/bot"):
            return None

        running_requests = len(
            [
                bot
                for bot in running_bots.values()
                if bot.status in {"running", "queued"}
            ]
        )

        if running_requests >= int(MAX_PARALLEL_TRAININGS):
            return response.json(
                {
                    "message": f"Too many parallel bot runs, above "
                    f"the limit of {MAX_PARALLEL_TRAININGS}. "
                    f"Retry later or increase your server's "
                    f"memory and CPU resources."
                },
                status=HTTPStatus.TOO_MANY_REQUESTS,
            )

    @bp.get("/")
    async def health(request: Request) -> response.HTTPResponse:
        """Health endpoint: status plus a summary of all bots and trainings."""
        return json(
            {
                "status": "ok",
                "bots": [
                    {
                        "deployment_id": bot.deployment_id,
                        "status": bot.status,
                        "internal_url": bot.internal_url,
                        "url": bot.url,
                    }
                    for bot in running_bots.values()
                ],
                "trainings": [
                    {
                        "training_id": training.training_id,
                        "assistant_id": training.assistant_id,
                        "client_id": training.client_id,
                        "progress": training.progress,
                        "status": training.status,
                    }
                    for training in trainings.values()
                ],
            }
        )

    @bp.get("/training")
    async def get_training_list(request: Request) -> response.HTTPResponse:
        """Return a list of all training sessions for an assistant."""
        # Filtered by the `assistant_id` query parameter; no parameter means
        # no matches (sessions with assistant_id == None would still match).
        assistant_id = request.args.get("assistant_id")
        sessions = [
            {
                "training_id": session.training_id,
                "assistant_id": session.assistant_id,
                "client_id": session.client_id,
                "progress": session.progress,
                "status": session.status,
                "model_name": session.model_name,
                "runtime_metadata": None,
            }
            for session in trainings.values()
            if session.assistant_id == assistant_id
        ]
        return json({"training_sessions": sessions, "total_number": len(sessions)})

    @bp.post("/training")
    async def start_training(request: Request) -> response.HTTPResponse:
        """Start a new training session.

        Expects a JSON body with ``id``, ``assistant_id``, optional
        ``client_id`` and ``bot_config.data`` (encoded training files).
        Responds 409 for a duplicate id, 400 for missing required fields.
        """
        data = request.json
        training_id: Optional[str] = data.get("id")
        assistant_id: Optional[str] = data.get("assistant_id")
        client_id: Optional[str] = data.get("client_id")
        encoded_training_data: Dict[str, str] = data.get("bot_config", {}).get(
            "data", {}
        )

        if training_id in trainings:
            # fail, because there apparently is already a training with this id
            return json({"message": "Training with this id already exists"}, status=409)

        if not assistant_id:
            return json({"message": "Assistant id is required"}, status=400)

        if not training_id:
            return json({"message": "Training id is required"}, status=400)

        try:
            training_session = run_training(
                training_id=training_id,
                assistant_id=assistant_id,
                client_id=client_id,
                encoded_training_data=encoded_training_data,
            )
            trainings[training_id] = training_session
            return json(
                {"training_id": training_id, "model_name": training_session.model_name}
            )
        except Exception as e:
            # NOTE(review): str(e) is returned to the caller verbatim — may
            # leak internal details; consider a generic message plus a log.
            return json({"message": str(e)}, status=500)

    @bp.get("/training/<training_id>")
    async def get_training(request: Request, training_id: str) -> response.HTTPResponse:
        """Return the status of a training session."""
        if training := trainings.get(training_id):
            return json(
                {
                    "training_id": training_id,
                    "assistant_id": training.assistant_id,
                    "client_id": training.client_id,
                    "progress": training.progress,
                    "model_name": training.model_name,
                    "status": training.status,
                    # full log file content is inlined into the response
                    "logs": get_logs_content(training_id),
                }
            )
        else:
            return json({"message": "Training not found"}, status=404)

    @bp.delete("/training/<training_id>")
    async def stop_training(
        request: Request, training_id: str
    ) -> response.HTTPResponse:
        """Terminate a training session; 404 if the id is unknown."""
        # this is a no-op if the training is already done
        if not (training := trainings.get(training_id)):
            return json({"message": "Training session not found"}, status=404)

        terminate_training(training)
        return json({"training_id": training_id})

    @bp.post("/bot")
    async def start_bot(request: Request) -> response.HTTPResponse:
        """Start a bot for a trained model.

        Expects a JSON body with ``deployment_id``, ``model_name`` and an
        optional ``bot_config``. Responds 409 for a duplicate deployment id,
        400 for missing fields, 404 when the model cannot be found.
        """
        data = request.json
        deployment_id: Optional[str] = data.get("deployment_id")
        model_name: Optional[str] = data.get("model_name")
        encoded_configs: Dict[str, str] = data.get("bot_config", {})

        if deployment_id in running_bots:
            # fail, because there apparently is already a bot running with this id
            return json(
                {"message": "Bot with this deployment id already exists"}, status=409
            )

        if not deployment_id:
            return json({"message": "Deployment id is required"}, status=400)

        if not model_name:
            return json({"message": "Model name is required"}, status=400)

        base_url_path = base_server_url(request)
        try:
            bot_session = run_bot(
                deployment_id,
                model_name,
                base_url_path,
                encoded_configs,
            )
            running_bots[deployment_id] = bot_session
            return json(
                {
                    "deployment_id": deployment_id,
                    "status": bot_session.status,
                    "url": bot_session.url,
                }
            )
        except ModelNotFound:
            return json(
                {"message": f"Model with name '{model_name}' could not be found."},
                status=404,
            )
        except Exception as e:
            return json({"message": str(e)}, status=500)

    @bp.delete("/bot/<deployment_id>")
    async def stop_bot(request: Request, deployment_id: str) -> response.HTTPResponse:
        """Terminate a running bot; 404 if the deployment id is unknown."""
        bot = running_bots.get(deployment_id)
        if bot is None:
            return json({"message": "Bot not found"}, status=404)

        terminate_bot(bot)

        return json(
            {"deployment_id": deployment_id, "status": bot.status, "url": bot.url}
        )

    @bp.get("/bot/<deployment_id>")
    async def get_bot(request: Request, deployment_id: str) -> response.HTTPResponse:
        """Return status, URL and logs for a single bot deployment."""
        bot = running_bots.get(deployment_id)
        if bot is None:
            return json({"message": "Bot not found"}, status=404)

        return json(
            {
                "deployment_id": deployment_id,
                "status": bot.status,
                "url": bot.url,
                "logs": get_logs_content(deployment_id),
            }
        )

    @bp.get("/bot")
    async def list_bots(request: Request) -> response.HTTPResponse:
        """Return a summary list of all bot deployments."""
        bots = [
            {
                "deployment_id": bot.deployment_id,
                "status": bot.status,
                "url": bot.url,
            }
            for bot in running_bots.values()
        ]
        return json({"deployment_sessions": bots, "total_number": len(bots)})

    return bp
|
|
394
|
+
|
|
395
|
+
|
|
396
|
+
def external_blueprint() -> Blueprint:
    """Create the externally exposed blueprint of the model manager API.

    Provides a socket.io bridge to running bots, a health endpoint, and an
    authenticated model-download route.
    """
    from rasa.core.channels.socketio import SocketBlueprint

    sio = AsyncServer(async_mode="sanic", cors_allowed_origins=[])
    bp = SocketBlueprint(sio, "", "model_api_external")

    # Wire the socket.io server to the currently running bot sessions.
    create_bridge_server(sio, running_bots)

    @bp.get("/health")
    async def health(request: Request) -> response.HTTPResponse:
        """Report service status plus summaries of all bots and trainings."""
        bot_summaries = [
            {
                "deployment_id": session.deployment_id,
                "status": session.status,
                "internal_url": session.internal_url,
                "url": session.url,
            }
            for session in running_bots.values()
        ]
        training_summaries = [
            {
                "training_id": session.training_id,
                "assistant_id": session.assistant_id,
                "client_id": session.client_id,
                "progress": session.progress,
                "status": session.status,
            }
            for session in trainings.values()
        ]
        return json(
            {
                "status": "ok",
                "bots": bot_summaries,
                "trainings": training_summaries,
            }
        )

    @bp.route("/models/<model_name>")
    @requires_studio_auth()
    async def send_model(request: Request, model_name: str) -> response.HTTPResponse:
        """Stream a model archive to an authenticated caller; 404 if absent."""
        try:
            model_path = path_to_model(model_name)
            if not model_path:
                return json({"message": "Model not found"}, status=404)
            return await response.file(model_path)
        except (NotFound, ModelNotFound):
            return json({"message": "Model not found"}, status=404)

    return bp
|
|
448
|
+
|
|
449
|
+
|
|
450
|
+
def path_to_model(model_name: str) -> Optional[str]:
    """Return the filesystem path of a model archive, or ``None``.

    Looks for the archive locally first; if absent and remote storage is
    configured, attempts to download it into the models directory.
    """
    archive_name = f"{model_name}.{MODEL_ARCHIVE_EXTENSION}"
    local_path = subpath(models_base_path(), archive_name)

    if os.path.exists(local_path):
        return local_path

    if not config.SERVER_MODEL_REMOTE_STORAGE:
        return None

    structlogger.info(
        "model_api.storage.fetching_remote_model",
        model_name=archive_name,
    )
    return fetch_remote_model_to_dir(
        archive_name,
        models_base_path(),
        config.SERVER_MODEL_REMOTE_STORAGE,
    )
|