PyPI - aiverify-moonshot - Versions diffs - 0.4.0__py3-none-any.whl - Mend

aiverify-moonshot 0.4.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (163) hide show

aiverify_moonshot-0.4.0.dist-info/METADATA +249 -0
aiverify_moonshot-0.4.0.dist-info/RECORD +163 -0
aiverify_moonshot-0.4.0.dist-info/WHEEL +4 -0
aiverify_moonshot-0.4.0.dist-info/licenses/AUTHORS.md +5 -0
aiverify_moonshot-0.4.0.dist-info/licenses/LICENSE.md +201 -0
aiverify_moonshot-0.4.0.dist-info/licenses/NOTICES.md +3340 -0
moonshot/__init__.py +0 -0
moonshot/__main__.py +198 -0
moonshot/api.py +155 -0
moonshot/integrations/__init__.py +0 -0
moonshot/integrations/cli/__init__.py +0 -0
moonshot/integrations/cli/__main__.py +25 -0
moonshot/integrations/cli/active_session_cfg.py +1 -0
moonshot/integrations/cli/benchmark/__init__.py +0 -0
moonshot/integrations/cli/benchmark/benchmark.py +186 -0
moonshot/integrations/cli/benchmark/cookbook.py +545 -0
moonshot/integrations/cli/benchmark/datasets.py +164 -0
moonshot/integrations/cli/benchmark/metrics.py +141 -0
moonshot/integrations/cli/benchmark/recipe.py +598 -0
moonshot/integrations/cli/benchmark/result.py +216 -0
moonshot/integrations/cli/benchmark/run.py +140 -0
moonshot/integrations/cli/benchmark/runner.py +174 -0
moonshot/integrations/cli/cli.py +64 -0
moonshot/integrations/cli/common/__init__.py +0 -0
moonshot/integrations/cli/common/common.py +72 -0
moonshot/integrations/cli/common/connectors.py +325 -0
moonshot/integrations/cli/common/display_helper.py +42 -0
moonshot/integrations/cli/common/prompt_template.py +94 -0
moonshot/integrations/cli/initialisation/__init__.py +0 -0
moonshot/integrations/cli/initialisation/initialisation.py +14 -0
moonshot/integrations/cli/redteam/__init__.py +0 -0
moonshot/integrations/cli/redteam/attack_module.py +70 -0
moonshot/integrations/cli/redteam/context_strategy.py +147 -0
moonshot/integrations/cli/redteam/prompt_template.py +67 -0
moonshot/integrations/cli/redteam/redteam.py +90 -0
moonshot/integrations/cli/redteam/session.py +467 -0
moonshot/integrations/web_api/.env.dev +7 -0
moonshot/integrations/web_api/__init__.py +0 -0
moonshot/integrations/web_api/__main__.py +56 -0
moonshot/integrations/web_api/app.py +125 -0
moonshot/integrations/web_api/container.py +146 -0
moonshot/integrations/web_api/log/.gitkeep +0 -0
moonshot/integrations/web_api/logging_conf.py +114 -0
moonshot/integrations/web_api/routes/__init__.py +0 -0
moonshot/integrations/web_api/routes/attack_modules.py +66 -0
moonshot/integrations/web_api/routes/benchmark.py +116 -0
moonshot/integrations/web_api/routes/benchmark_result.py +175 -0
moonshot/integrations/web_api/routes/context_strategy.py +129 -0
moonshot/integrations/web_api/routes/cookbook.py +225 -0
moonshot/integrations/web_api/routes/dataset.py +120 -0
moonshot/integrations/web_api/routes/endpoint.py +282 -0
moonshot/integrations/web_api/routes/metric.py +78 -0
moonshot/integrations/web_api/routes/prompt_template.py +128 -0
moonshot/integrations/web_api/routes/recipe.py +219 -0
moonshot/integrations/web_api/routes/redteam.py +609 -0
moonshot/integrations/web_api/routes/runner.py +239 -0
moonshot/integrations/web_api/schemas/__init__.py +0 -0
moonshot/integrations/web_api/schemas/benchmark_runner_dto.py +13 -0
moonshot/integrations/web_api/schemas/cookbook_create_dto.py +19 -0
moonshot/integrations/web_api/schemas/cookbook_response_model.py +9 -0
moonshot/integrations/web_api/schemas/dataset_response_dto.py +9 -0
moonshot/integrations/web_api/schemas/endpoint_create_dto.py +21 -0
moonshot/integrations/web_api/schemas/endpoint_response_model.py +11 -0
moonshot/integrations/web_api/schemas/prompt_response_model.py +14 -0
moonshot/integrations/web_api/schemas/prompt_template_response_model.py +10 -0
moonshot/integrations/web_api/schemas/recipe_create_dto.py +32 -0
moonshot/integrations/web_api/schemas/recipe_response_model.py +7 -0
moonshot/integrations/web_api/schemas/session_create_dto.py +16 -0
moonshot/integrations/web_api/schemas/session_prompt_dto.py +7 -0
moonshot/integrations/web_api/schemas/session_response_model.py +38 -0
moonshot/integrations/web_api/services/__init__.py +0 -0
moonshot/integrations/web_api/services/attack_module_service.py +34 -0
moonshot/integrations/web_api/services/auto_red_team_test_manager.py +86 -0
moonshot/integrations/web_api/services/auto_red_team_test_state.py +57 -0
moonshot/integrations/web_api/services/base_service.py +8 -0
moonshot/integrations/web_api/services/benchmark_result_service.py +25 -0
moonshot/integrations/web_api/services/benchmark_test_manager.py +106 -0
moonshot/integrations/web_api/services/benchmark_test_state.py +56 -0
moonshot/integrations/web_api/services/benchmarking_service.py +31 -0
moonshot/integrations/web_api/services/context_strategy_service.py +22 -0
moonshot/integrations/web_api/services/cookbook_service.py +194 -0
moonshot/integrations/web_api/services/dataset_service.py +20 -0
moonshot/integrations/web_api/services/endpoint_service.py +65 -0
moonshot/integrations/web_api/services/metric_service.py +14 -0
moonshot/integrations/web_api/services/prompt_template_service.py +39 -0
moonshot/integrations/web_api/services/recipe_service.py +155 -0
moonshot/integrations/web_api/services/runner_service.py +147 -0
moonshot/integrations/web_api/services/session_service.py +350 -0
moonshot/integrations/web_api/services/utils/exceptions_handler.py +41 -0
moonshot/integrations/web_api/services/utils/results_formatter.py +47 -0
moonshot/integrations/web_api/status_updater/interface/benchmark_progress_callback.py +14 -0
moonshot/integrations/web_api/status_updater/interface/redteam_progress_callback.py +14 -0
moonshot/integrations/web_api/status_updater/moonshot_ui_webhook.py +72 -0
moonshot/integrations/web_api/types/types.py +99 -0
moonshot/src/__init__.py +0 -0
moonshot/src/api/__init__.py +0 -0
moonshot/src/api/api_connector.py +58 -0
moonshot/src/api/api_connector_endpoint.py +162 -0
moonshot/src/api/api_context_strategy.py +57 -0
moonshot/src/api/api_cookbook.py +160 -0
moonshot/src/api/api_dataset.py +46 -0
moonshot/src/api/api_environment_variables.py +17 -0
moonshot/src/api/api_metrics.py +51 -0
moonshot/src/api/api_prompt_template.py +43 -0
moonshot/src/api/api_recipe.py +182 -0
moonshot/src/api/api_red_teaming.py +59 -0
moonshot/src/api/api_result.py +84 -0
moonshot/src/api/api_run.py +74 -0
moonshot/src/api/api_runner.py +132 -0
moonshot/src/api/api_session.py +290 -0
moonshot/src/configs/__init__.py +0 -0
moonshot/src/configs/env_variables.py +187 -0
moonshot/src/connectors/__init__.py +0 -0
moonshot/src/connectors/connector.py +327 -0
moonshot/src/connectors/connector_prompt_arguments.py +17 -0
moonshot/src/connectors_endpoints/__init__.py +0 -0
moonshot/src/connectors_endpoints/connector_endpoint.py +211 -0
moonshot/src/connectors_endpoints/connector_endpoint_arguments.py +54 -0
moonshot/src/cookbooks/__init__.py +0 -0
moonshot/src/cookbooks/cookbook.py +225 -0
moonshot/src/cookbooks/cookbook_arguments.py +34 -0
moonshot/src/datasets/__init__.py +0 -0
moonshot/src/datasets/dataset.py +255 -0
moonshot/src/datasets/dataset_arguments.py +50 -0
moonshot/src/metrics/__init__.py +0 -0
moonshot/src/metrics/metric.py +192 -0
moonshot/src/metrics/metric_interface.py +95 -0
moonshot/src/prompt_templates/__init__.py +0 -0
moonshot/src/prompt_templates/prompt_template.py +103 -0
moonshot/src/recipes/__init__.py +0 -0
moonshot/src/recipes/recipe.py +340 -0
moonshot/src/recipes/recipe_arguments.py +111 -0
moonshot/src/redteaming/__init__.py +0 -0
moonshot/src/redteaming/attack/__init__.py +0 -0
moonshot/src/redteaming/attack/attack_module.py +618 -0
moonshot/src/redteaming/attack/attack_module_arguments.py +44 -0
moonshot/src/redteaming/attack/context_strategy.py +131 -0
moonshot/src/redteaming/context_strategy/__init__.py +0 -0
moonshot/src/redteaming/context_strategy/context_strategy_interface.py +46 -0
moonshot/src/redteaming/session/__init__.py +0 -0
moonshot/src/redteaming/session/chat.py +209 -0
moonshot/src/redteaming/session/red_teaming_progress.py +128 -0
moonshot/src/redteaming/session/red_teaming_type.py +6 -0
moonshot/src/redteaming/session/session.py +775 -0
moonshot/src/results/__init__.py +0 -0
moonshot/src/results/result.py +119 -0
moonshot/src/results/result_arguments.py +44 -0
moonshot/src/runners/__init__.py +0 -0
moonshot/src/runners/runner.py +476 -0
moonshot/src/runners/runner_arguments.py +46 -0
moonshot/src/runners/runner_type.py +6 -0
moonshot/src/runs/__init__.py +0 -0
moonshot/src/runs/run.py +344 -0
moonshot/src/runs/run_arguments.py +162 -0
moonshot/src/runs/run_progress.py +145 -0
moonshot/src/runs/run_status.py +10 -0
moonshot/src/storage/__init__.py +0 -0
moonshot/src/storage/db_interface.py +128 -0
moonshot/src/storage/io_interface.py +31 -0
moonshot/src/storage/storage.py +525 -0
moonshot/src/utils/__init__.py +0 -0
moonshot/src/utils/import_modules.py +96 -0
moonshot/src/utils/timeit.py +25 -0

moonshot/integrations/cli/benchmark/recipe.py ADDED Viewed

@@ -0,0 +1,598 @@
+import asyncio
+from ast import literal_eval
+import cmd2
+from rich.console import Console
+from rich.table import Table
+from slugify import slugify
+from moonshot.api import (
+    api_create_recipe,
+    api_create_runner,
+    api_delete_recipe,
+    api_get_all_recipe,
+    api_get_all_run,
+    api_get_all_runner_name,
+    api_load_runner,
+    api_read_recipe,
+    api_update_recipe,
+)
+from moonshot.integrations.cli.common.display_helper import display_view_list_format
+console = Console()
+# ------------------------------------------------------------------------------
+# CLI Functions
+# ------------------------------------------------------------------------------
+def add_recipe(args) -> None:
+    """
+    Create a recipe from the parsed command-line arguments.
+    The list/dict arguments arrive as strings holding Python literals; they are decoded with literal_eval and
+    passed, together with the name and description, to api_create_recipe.
+    Optional arguments that are falsy (not supplied) fall back to an empty list, or to an empty dict for the
+    grading scale.
+    Args:
+        args (argparse.Namespace): The arguments provided to the command line interface.
+        Attributes read are name, description, tags, categories, datasets, prompt_templates, metrics,
+        attack_modules, and grading_scale.
+    Returns:
+        None
+    Note:
+        Any exception raised while decoding the arguments or creating the recipe is caught and printed with an
+        "[add_recipe]" prefix; nothing is re-raised.
+    """
+    def _optional(raw, fallback):
+        # A falsy value (None or an empty string) means the flag was not given.
+        return literal_eval(raw) if raw else fallback
+    try:
+        # Decoded in the positional order api_create_recipe receives them after name and description.
+        recipe_fields = (
+            _optional(args.tags, []),
+            literal_eval(args.categories),
+            literal_eval(args.datasets),
+            _optional(args.prompt_templates, []),
+            literal_eval(args.metrics),
+            _optional(args.attack_modules, []),
+            _optional(args.grading_scale, {}),
+        )
+        created_id = api_create_recipe(args.name, args.description, *recipe_fields)
+        print(f"[add_recipe]: Recipe ({created_id}) created.")
+    except Exception as e:
+        print(f"[add_recipe]: {e}")
+def list_recipes() -> None:
+    """
+    Print every available recipe.
+    The recipes are fetched with api_get_all_recipe and handed straight to display_recipes for rendering.
+    Any exception raised along the way is caught and printed with a "[list_recipes]" prefix.
+    Returns:
+        None
+    """
+    try:
+        display_recipes(api_get_all_recipe())
+    except Exception as e:
+        print(f"[list_recipes]: {e}")
+def view_recipe(args) -> None:
+    """
+    Print a single recipe.
+    The recipe is read with api_read_recipe and rendered through display_recipes as a one-element list, so it
+    uses the same table layout as the full listing.
+    Any exception raised along the way is caught and printed with a "[view_recipe]" prefix.
+    Args:
+        args: A namespace object from argparse. It should have the following attribute:
+            recipe (str): The id of the recipe to view.
+    Returns:
+        None
+    """
+    try:
+        selected_recipe = api_read_recipe(args.recipe)
+        # display_recipes expects a list, so wrap the single recipe.
+        display_recipes([selected_recipe])
+    except Exception as e:
+        print(f"[view_recipe]: {e}")
+def run_recipe(args) -> None:
+    """
+    Execute a list of recipes against a list of endpoints and display the result.
+    The runner name is slugified; if a runner with that id already exists it is loaded, otherwise a new runner
+    is created with the given name and endpoints. The recipes are then run to completion on the event loop,
+    the runner is closed, and the results of the runner's latest run are shown with show_recipe_results.
+    Args:
+        args: A namespace object from argparse. It should have the following attributes:
+            name (str): The name of the recipe runner.
+            recipes (str): A string representation of a list of recipes to run.
+            endpoints (str): A string representation of a list of endpoints to run.
+            num_of_prompts (int): The number of prompts to run.
+            random_seed (int): The random seed number for reproducibility.
+            system_prompt (str): The system prompt to use.
+            runner_proc_module (str): The runner processing module to use.
+            result_proc_module (str): The result processing module to use.
+    Returns:
+        None
+    Note:
+        Every exception (including the RuntimeError raised when no result was produced) is caught and printed
+        with a "[run_recipe]" prefix; nothing is re-raised.
+    """
+    try:
+        name = args.name
+        recipes = literal_eval(args.recipes)
+        endpoints = literal_eval(args.endpoints)
+        num_of_prompts = args.num_of_prompts
+        random_seed = args.random_seed
+        system_prompt = args.system_prompt
+        runner_proc_module = args.runner_proc_module
+        result_proc_module = args.result_proc_module
+        # Reuse the runner when one with the same slugified id exists.
+        # NOTE(review): in that case the endpoints argument is only used for display, not passed to the runner.
+        slugify_id = slugify(name, lowercase=True)
+        if slugify_id in api_get_all_runner_name():
+            rec_runner = api_load_runner(slugify_id)
+        else:
+            rec_runner = api_create_runner(name, endpoints)
+        try:
+            loop = asyncio.get_event_loop()
+            loop.run_until_complete(
+                rec_runner.run_recipes(
+                    recipes,
+                    num_of_prompts,
+                    random_seed,
+                    system_prompt,
+                    runner_proc_module,
+                    result_proc_module,
+                )
+            )
+        finally:
+            # Always release the runner, even when the run itself fails.
+            rec_runner.close()
+        # Display results of the most recent run; an empty run list counts as "no result".
+        runner_runs = api_get_all_run(rec_runner.id)
+        result_info = runner_runs[-1].get("results") if runner_runs else None
+        if not result_info:
+            raise RuntimeError("no run result generated")
+        show_recipe_results(
+            recipes, endpoints, result_info, result_info["metadata"]["duration"]
+        )
+    except Exception as e:
+        print(f"[run_recipe]: {str(e)}")
+def update_recipe(args) -> None:
+    """
+    Apply key/value updates to an existing recipe.
+    The update_values string is decoded with literal_eval, converted to a dict, and forwarded as keyword
+    arguments to api_update_recipe together with the recipe id.
+    Any exception raised along the way is caught and printed with an "[update_recipe]" prefix.
+    Args:
+        args: A namespace object from argparse. It should have the following attributes:
+            recipe (str): The id of the recipe to update.
+            update_values (str): A string representation of a list of tuples. Each tuple contains a key
+            and a value to update in the recipe.
+    Returns:
+        None
+    """
+    try:
+        target_recipe = args.recipe
+        # dict() turns the decoded (key, value) pairs into keyword arguments.
+        changes = dict(literal_eval(args.update_values))
+        api_update_recipe(target_recipe, **changes)
+        print("[update_recipe]: Recipe updated.")
+    except Exception as e:
+        print(f"[update_recipe]: {e}")
+def delete_recipe(args) -> None:
+    """
+    Delete a recipe after an interactive confirmation.
+    The user is asked to confirm on the console. Only an answer of "y" (case-insensitive) proceeds to
+    api_delete_recipe; any other answer prints a cancellation message and leaves the recipe untouched.
+    An exception raised by the deletion is caught and printed with a "[delete_recipe]" prefix.
+    Args:
+        args: A namespace object from argparse. It should have the following attribute:
+            recipe (str): The identifier of the recipe to delete.
+    Returns:
+        None
+    """
+    answer = console.input(
+        "[bold red]Are you sure you want to delete the recipe (y/N)? [/]"
+    )
+    if answer.lower() == "y":
+        try:
+            api_delete_recipe(args.recipe)
+            print("[delete_recipe]: Recipe deleted.")
+        except Exception as e:
+            print(f"[delete_recipe]: {e}")
+    else:
+        # Anything other than an explicit "y" is treated as "no".
+        console.print("[bold yellow]Recipe deletion cancelled.[/]")
+# ------------------------------------------------------------------------------
+# Helper functions: Display on cli
+# ------------------------------------------------------------------------------
+def display_view_grading_scale_format(title: str, grading_scale: dict) -> str:
+    """
+    Render a grading scale as rich-markup text.
+    The title is emitted in blue, followed by one numbered line per grade in the form
+    "<n>. <grade> [<lower> - <upper>]", where the bounds are the first two items of the grade's value.
+    A falsy grading scale yields the title followed by 'nil'.
+    Args:
+        title (str): The title to display above the grading scale.
+        grading_scale (dict): A dictionary with grade levels as keys and indexable ranges as values.
+    Returns:
+        str: The formatted grading scale as a string.
+    """
+    if not grading_scale:
+        return f"[blue]{title}[/blue]: nil"
+    grade_lines = []
+    for position, (grade, bounds) in enumerate(grading_scale.items(), start=1):
+        # Index rather than unpack so values longer than two items are still accepted.
+        lower, upper = bounds[0], bounds[1]
+        grade_lines.append(f"{position}. {grade} [{lower} - {upper}]")
+    return f"[blue]{title}[/blue]:\n" + "\n".join(grade_lines)
+def display_view_statistics_format(title: str, stats: dict) -> str:
+    """
+    Render a statistics dictionary as rich-markup text.
+    The title is emitted in blue, followed by one numbered entry per statistic. A plain value is shown on the
+    same line as its key; a dict value is expanded into indented "key: value" lines below the key.
+    A falsy statistics dictionary yields the title followed by 'nil'.
+    Args:
+        title (str): The title to display above the statistics.
+        stats (dict): A dictionary with various statistics as keys and their counts or sub-statistics as values.
+    Returns:
+        str: The formatted statistics as a string.
+    """
+    if not stats:
+        return f"[blue]{title}[/blue]: nil"
+    entries = []
+    position = 0
+    for stat_name, stat_value in stats.items():
+        position += 1
+        if not isinstance(stat_value, dict):
+            entries.append(f"{position}. {stat_name}: {stat_value}")
+            continue
+        # Nested statistics: one indented line per sub-entry.
+        nested_lines = [
+            f"    {nested_key}: {nested_value}"
+            for nested_key, nested_value in stat_value.items()
+        ]
+        entries.append(f"{position}. {stat_name}:\n" + "\n".join(nested_lines))
+    return f"[blue]{title}[/blue]:\n" + "\n".join(entries)
+def display_recipes(recipes_list: list) -> None:
+    """
+    Print the given recipes as a three-column table.
+    Each recipe becomes one row: a running number, a "Recipe" cell (id, name, description, tags, categories,
+    grading scale and statistics) and a "Contains" cell (datasets, prompt templates, metrics and attack
+    strategies). A falsy list prints a message saying that no recipes are found.
+    Args:
+        recipes_list (list): A list of dictionaries, where each dictionary contains the details of a recipe.
+    """
+    if not recipes_list:
+        console.print("[red]There are no recipes found.[/red]")
+        return
+    recipes_table = Table(
+        title="List of Recipes", show_lines=True, expand=True, header_style="bold"
+    )
+    recipes_table.add_column("No.", width=2)
+    recipes_table.add_column("Recipe", justify="left", width=78)
+    recipes_table.add_column("Contains", justify="left", width=20, overflow="fold")
+    for row_no, recipe in enumerate(recipes_list, 1):
+        # Positional unpack: relies on every recipe dict holding exactly these eleven values in this order.
+        (
+            rec_id,
+            rec_name,
+            rec_description,
+            tags,
+            categories,
+            datasets,
+            prompt_templates,
+            metrics,
+            attack_strategies,
+            grading_scale,
+            stats,
+        ) = recipe.values()
+        tags_text = display_view_list_format("Tags", tags)
+        categories_text = display_view_list_format("Categories", categories)
+        datasets_text = display_view_list_format("Datasets", datasets)
+        templates_text = display_view_list_format("Prompt Templates", prompt_templates)
+        metrics_text = display_view_list_format("Metrics", metrics)
+        attacks_text = display_view_list_format("Attack Strategies", attack_strategies)
+        grading_text = display_view_grading_scale_format("Grading Scale", grading_scale)
+        stats_text = display_view_statistics_format("Statistics", stats)
+        # Left cell: what the recipe is; right cell: what it is made of.
+        recipe_cell = (
+            f"[red]id: {rec_id}[/red]\n\n[blue]{rec_name}[/blue]\n{rec_description}\n\n"
+            f"{tags_text}\n\n{categories_text}\n\n{grading_text}\n\n{stats_text}"
+        )
+        contains_cell = (
+            f"{datasets_text}\n\n{templates_text}\n\n{metrics_text}\n\n{attacks_text}"
+        )
+        recipes_table.add_section()
+        recipes_table.add_row(str(row_no), recipe_cell, contains_cell)
+    console.print(recipes_table)
+def show_recipe_results(recipes, endpoints, recipe_results, duration):
+    """
+    Print the outcome of a recipe benchmarking run.
+    When recipe_results is truthy the results table is produced by generate_recipe_table; otherwise a
+    "no results" message is printed. In both cases a footer with the run duration follows.
+    Args:
+        recipes (list): A list of recipes that were benchmarked.
+        endpoints (list): A list of endpoints that were used in the benchmarking.
+        recipe_results (dict): A dictionary with the results of the recipe benchmarking.
+        duration (float): The time taken to run the benchmarking in seconds.
+    Returns:
+        None
+    """
+    if not recipe_results:
+        console.print("[red]There are no results.[/red]")
+    else:
+        generate_recipe_table(recipes, endpoints, recipe_results)
+    # Footer with run stats, framed by two rules of 50 '=' characters.
+    rule = "=" * 50
+    console.print(
+        f"{rule}\n[blue]Time taken to run: {duration}s[/blue]\n*Overall rating will be the lowest grade that the recipes have in each cookbook\n{rule}"
+    )
+def generate_recipe_table(recipes: list, endpoints: list, results: dict) -> None:
+    """
+    Build and print the recipe-by-endpoint results table.
+    The table has a running number, a "Recipe" column and one column per endpoint. For every recipe the first
+    entry of results["results"]["recipes"] with a matching "id" is used; within it, the first evaluation
+    summary whose "model_id" equals the endpoint supplies the cell, shown as "<grade> [<avg_grade_value>]".
+    A cell is "-" when no summary is found, when either key is missing, or when the grade is falsy. A recipe
+    without any matching result gets a row of "-" cells.
+    Args:
+        recipes (list): A list of recipe IDs that were benchmarked.
+        endpoints (list): A list of endpoint IDs against which the recipes were run.
+        results (dict): A dictionary containing the results of the benchmarking.
+    Returns:
+        None: This function does not return anything. It prints the table to the console.
+    """
+    result_table = Table(
+        title="Recipes Result", show_lines=True, expand=True, header_style="bold"
+    )
+    result_table.add_column("No.", width=2)
+    result_table.add_column("Recipe", justify="left", width=78)
+    for endpoint_id in endpoints:
+        result_table.add_column(endpoint_id, justify="center")
+    for row_no, recipe_id in enumerate(recipes, start=1):
+        # First result entry belonging to this recipe, if any.
+        matched_result = None
+        for candidate in results["results"]["recipes"]:
+            if candidate["id"] == recipe_id:
+                matched_result = candidate
+                break
+        if not matched_result:
+            # Nothing recorded for this recipe: fill the whole row with placeholders.
+            result_table.add_row(
+                str(row_no),
+                f"Recipe: [blue]{recipe_id}[/blue]",
+                *(["-"] * len(endpoints)),
+                end_section=True,
+            )
+            continue
+        cells = []
+        for endpoint_id in endpoints:
+            # First evaluation summary produced for this endpoint, if any.
+            summary = None
+            for entry in matched_result["evaluation_summary"]:
+                if entry["model_id"] == endpoint_id:
+                    summary = entry
+                    break
+            has_grade = (
+                summary
+                and "grade" in summary
+                and "avg_grade_value" in summary
+                and summary["grade"]
+            )
+            if has_grade:
+                cells.append(f"{summary['grade']} [{summary['avg_grade_value']}]")
+            else:
+                cells.append("-")
+        result_table.add_row(
+            str(row_no),
+            f"Recipe: [blue]{matched_result['id']}[/blue]",
+            *cells,
+            end_section=True,
+        )
+    console.print(result_table)
+# ------------------------------------------------------------------------------
+# Cmd2 Arguments Parsers
+# ------------------------------------------------------------------------------
+# Add recipe arguments
+# Parser for the add_recipe command.
+# Positional arguments are consumed in registration order: name, description, categories, datasets, metrics.
+# The optional flags (-t, -p, -a, -g) use nargs="?" and have no default, so they are None when omitted.
+add_recipe_args = cmd2.Cmd2ArgumentParser(
+    description="Add a new recipe. The 'name' argument will be slugified to create a unique identifier.",
+    epilog="Example:\n add_recipe 'My new recipe' "
+    "'I am recipe description' "
+    "\"['category1','category2']\" "
+    "\"['bbq-lite-age-ambiguous']\" "
+    "\"['bertscore','bleuscore']\" "
+    "-p \"['analogical-similarity','mmlu']\" "
+    "-t \"['tag1','tag2']\" "
+    "-a \"['charswap_attack']\" "
+    "-g \"{'A':[80,100],'B':[60,79],'C':[40,59],'D':[20,39],'E':[0,19]}\" ",
+)
+add_recipe_args.add_argument("name", type=str, help="Name of the new recipe")
+add_recipe_args.add_argument(
+    "description", type=str, help="Description of the new recipe"
+)
+add_recipe_args.add_argument(
+    "-t",
+    "--tags",
+    type=str,
+    help="List of tags to be included in the new recipe",
+    nargs="?",
+)
+# Help text previously repeated the tags description; this argument carries the categories.
+add_recipe_args.add_argument(
+    "categories",
+    type=str,
+    help="List of categories to be included in the new recipe",
+)
+add_recipe_args.add_argument("datasets", type=str, help="The dataset to be used")
+add_recipe_args.add_argument(
+    "-p",
+    "--prompt_templates",
+    type=str,
+    help="List of prompt templates to be included in the new recipe",
+    nargs="?",
+)
+add_recipe_args.add_argument(
+    "metrics", type=str, help="List of metrics to be included in the new recipe"
+)
+add_recipe_args.add_argument(
+    "-a",
+    "--attack_modules",
+    type=str,
+    help="List of attack modules to be included in the new recipe",
+    nargs="?",
+)
+add_recipe_args.add_argument(
+    "-g",
+    "--grading_scale",
+    type=str,
+    help="Dict of grading scale for the metric to be included in the new recipe",
+    nargs="?",
+)
+# Update recipe arguments
+# Parser for the update_recipe command: a recipe id followed by a string holding a list of (key, value) tuples.
+# The epilog documents the accepted keys; grading_scale is described as a dict, matching the add_recipe parser.
+update_recipe_args = cmd2.Cmd2ArgumentParser(
+    description="Update a recipe.",
+    epilog="Available keys for updating a recipe: \n"
+    "  name: The name of the recipe. \n"
+    "  description: The description of the recipe. \n"
+    "  tags: A list of tags associated with the recipe. \n"
+    "  categories: A list of categories used in the recipe. \n"
+    "  datasets: A list of datasets used in the recipe. \n"
+    "  prompt_templates: A list of prompt templates for the recipe. \n"
+    "  metrics: A list of metrics to evaluate the recipe. \n"
+    "  attack_modules: A list of attack modules used in the recipe.\n"
+    "  grading_scale: A dict of grading scale used in the recipe. \n\n"
+    "Example command:\n"
+    "  update_recipe my-new-recipe \"[('name', 'My Updated Recipe'), ('tags', ['fairness', 'bbq'])]\" ",
+)
+update_recipe_args.add_argument("recipe", type=str, help="Id of the recipe")
+update_recipe_args.add_argument(
+    "update_values", type=str, help="Update recipe key/value"
+)
+# View recipe arguments
+# Parser for the view_recipe command: takes the id of the recipe to show.
+view_recipe_args = cmd2.Cmd2ArgumentParser(
+    epilog="Example:\n view_recipe my-new-recipe",
+    description="View a recipe.",
+)
+view_recipe_args.add_argument(
+    "recipe",
+    help="Id of the recipe",
+    type=str,
+)
+# Delete recipe arguments
+# Parser for the delete_recipe command: takes the id of the recipe to remove.
+delete_recipe_args = cmd2.Cmd2ArgumentParser(
+    epilog="Example:\n delete_recipe my-new-recipe",
+    description="Delete a recipe.",
+)
+delete_recipe_args.add_argument(
+    "recipe",
+    help="Id of the recipe",
+    type=str,
+)
+# Run recipe arguments
+# Parser for the run_recipe command.
+# Positionals (in order): runner name, list of recipes, list of endpoints.
+# Options: -n prompts, -r seed, -s system prompt, -l runner processing module, -o result processing module.
+run_recipe_args = cmd2.Cmd2ArgumentParser(
+    epilog="Example:\n run_recipe "
+    '"my new recipe runner" '
+    "\"['bbq','mmlu']\" "
+    "\"['openai-gpt35-turbo']\" "
+    '-n 1 -r 1 -s "You are an intelligent AI" ',
+    description="Run a recipe.",
+)
+run_recipe_args.add_argument("name", help="Name of recipe runner", type=str)
+run_recipe_args.add_argument("recipes", help="List of recipes to run", type=str)
+run_recipe_args.add_argument("endpoints", help="List of endpoints to run", type=str)
+run_recipe_args.add_argument(
+    "-n",
+    "--num_of_prompts",
+    help="Number of prompts to run",
+    type=int,
+    default=0,
+)
+run_recipe_args.add_argument(
+    "-r",
+    "--random_seed",
+    help="Random seed number",
+    type=int,
+    default=0,
+)
+run_recipe_args.add_argument(
+    "-s",
+    "--system_prompt",
+    help="System Prompt to use",
+    type=str,
+    default="",
+)
+run_recipe_args.add_argument(
+    "-l",
+    "--runner_proc_module",
+    help="Runner processing module to use",
+    type=str,
+    default="benchmarking",
+)
+run_recipe_args.add_argument(
+    "-o",
+    "--result_proc_module",
+    help="Result processing module to use",
+    type=str,
+    default="benchmarking-result",
+)