aiverify-moonshot 0.4.7 → 0.4.9 (py3-none-any.whl)
This diff compares the contents of two publicly released versions of the package as published to their public registry. It is provided for informational purposes only.
- {aiverify_moonshot-0.4.7.dist-info → aiverify_moonshot-0.4.9.dist-info}/METADATA +3 -3
- {aiverify_moonshot-0.4.7.dist-info → aiverify_moonshot-0.4.9.dist-info}/RECORD +29 -29
- {aiverify_moonshot-0.4.7.dist-info → aiverify_moonshot-0.4.9.dist-info}/licenses/LICENSE.md +1 -1
- aiverify_moonshot-0.4.9.dist-info/licenses/NOTICES.md +2506 -0
- moonshot/__main__.py +93 -49
- moonshot/api.py +12 -10
- moonshot/integrations/cli/benchmark/metrics.py +8 -2
- moonshot/integrations/cli/cli_errors.py +14 -0
- moonshot/integrations/cli/common/common.py +14 -8
- moonshot/integrations/cli/common/dataset.py +303 -65
- moonshot/integrations/cli/redteam/attack_module.py +30 -1
- moonshot/integrations/web_api/app.py +1 -1
- moonshot/integrations/web_api/routes/dataset.py +52 -18
- moonshot/integrations/web_api/schemas/cookbook_response_model.py +2 -0
- moonshot/integrations/web_api/schemas/dataset_create_dto.py +14 -4
- moonshot/integrations/web_api/schemas/recipe_response_model.py +1 -0
- moonshot/integrations/web_api/services/cookbook_service.py +36 -9
- moonshot/integrations/web_api/services/dataset_service.py +34 -9
- moonshot/integrations/web_api/services/recipe_service.py +33 -3
- moonshot/src/api/api_dataset.py +43 -11
- moonshot/src/bookmark/bookmark.py +16 -9
- moonshot/src/datasets/dataset.py +37 -45
- moonshot/src/datasets/dataset_arguments.py +2 -1
- moonshot/src/messages_constants.py +1 -0
- moonshot/src/redteaming/attack/attack_module.py +40 -0
- moonshot/src/storage/io_interface.py +18 -1
- moonshot/src/storage/storage.py +57 -1
- aiverify_moonshot-0.4.7.dist-info/licenses/NOTICES.md +0 -3340
- {aiverify_moonshot-0.4.7.dist-info → aiverify_moonshot-0.4.9.dist-info}/WHEEL +0 -0
- {aiverify_moonshot-0.4.7.dist-info → aiverify_moonshot-0.4.9.dist-info}/licenses/AUTHORS.md +0 -0
moonshot/integrations/cli/common/dataset.py:

```diff
@@ -2,118 +2,356 @@ from ast import literal_eval
 
 import cmd2
 from rich.console import Console
+from rich.table import Table
+
+from moonshot.api import (
+    api_delete_dataset,
+    api_get_all_datasets,
+    api_get_all_datasets_name,
+    api_convert_dataset,
+    api_download_dataset
+)
 
-from moonshot.api import api_create_datasets
 from moonshot.integrations.cli.cli_errors import (
-
-
-
-
-
-    ERROR_COMMON_ADD_DATASET_REFERENCE_VALIDATION,
+    ERROR_BENCHMARK_DELETE_DATASET_DATASET_VALIDATION,
+    ERROR_BENCHMARK_LIST_DATASETS_FIND_VALIDATION,
+    ERROR_BENCHMARK_LIST_DATASETS_PAGINATION_VALIDATION,
+    ERROR_BENCHMARK_LIST_DATASETS_PAGINATION_VALIDATION_1,
+    ERROR_BENCHMARK_VIEW_DATASET_DATASET_FILENAME_VALIDATION,
 )
 
-
+from moonshot.integrations.cli.common.display_helper import display_view_str_format
+from moonshot.integrations.cli.utils.process_data import filter_data
 
+console = Console()
 
-def
+def list_datasets(args) -> list | None:
     """
-
+    List all available datasets.
 
-    This function
-
-
+    This function retrieves all available datasets by calling the api_get_all_datasets function from the
+    moonshot.api module. It then filters the datasets based on the provided keyword and pagination arguments.
+    If there are no datasets, it prints a message indicating that no datasets were found.
 
     Args:
-        args:
-
-
-
-
-
-            - params (dict): Additional parameters for dataset creation.
+        args: A namespace object from argparse. It should have optional attributes:
+            find (str): Optional keyword to filter datasets.
+            pagination (str): Optional tuple to paginate datasets.
+
+    Returns:
+        list | None: A list of datasets or None if there are no datasets.
     """
     try:
-
-
+        print("Listing datasets may take a while...")
+        if args.find is not None:
+            if not isinstance(args.find, str) or not args.find:
+                raise TypeError(ERROR_BENCHMARK_LIST_DATASETS_FIND_VALIDATION)
 
-        if
-            not isinstance(args.
-
-
-
-
+        if args.pagination is not None:
+            if not isinstance(args.pagination, str) or not args.pagination:
+                raise TypeError(ERROR_BENCHMARK_LIST_DATASETS_PAGINATION_VALIDATION)
+            try:
+                pagination = literal_eval(args.pagination)
+                if not (
+                    isinstance(pagination, tuple)
+                    and len(pagination) == 2
+                    and all(isinstance(i, int) for i in pagination)
+                ):
+                    raise ValueError(
+                        ERROR_BENCHMARK_LIST_DATASETS_PAGINATION_VALIDATION_1
+                    )
+            except (ValueError, SyntaxError):
+                raise ValueError(ERROR_BENCHMARK_LIST_DATASETS_PAGINATION_VALIDATION_1)
+        else:
+            pagination = ()
 
-
-
-
-
-
-
+        datasets_list = api_get_all_datasets()
+        keyword = args.find.lower() if args.find else ""
+
+        if datasets_list:
+            filtered_datasets_list = filter_data(datasets_list, keyword, pagination)
+            if filtered_datasets_list:
+                _display_datasets(filtered_datasets_list)
+                return filtered_datasets_list
+
+        console.print("[red]There are no datasets found.[/red]")
+        return None
 
+    except Exception as e:
+        print(f"[list_datasets]: {str(e)}")
+        return None
+
+
+def view_dataset(args) -> None:
+    """
+    View a specific dataset.
+
+    This function retrieves all available datasets and their names by calling the api_get_all_datasets and
+    api_get_all_datasets_name functions. It then finds the dataset with the name specified in args.dataset_filename
+    and displays it using the _display_datasets function. If an exception occurs, it prints an error message.
+
+    Args:
+        args: A namespace object from argparse. It should have the following attribute:
+            dataset_filename (str): The name of the dataset to view.
+
+    Returns:
+        None
+    """
+    try:
+        print("Viewing datasets may take a while...")
         if (
-            not isinstance(args.
-            or not args.
-            or args.
+            not isinstance(args.dataset_filename, str)
+            or not args.dataset_filename
+            or args.dataset_filename is None
         ):
-            raise TypeError(
+            raise TypeError(ERROR_BENCHMARK_VIEW_DATASET_DATASET_FILENAME_VALIDATION)
 
+        datasets_list = api_get_all_datasets()
+        datasets_name_list = api_get_all_datasets_name()
+
+        # Find the index of the dataset with the name args.dataset_filename
+        dataset_index = datasets_name_list.index(args.dataset_filename)
+        # Pass the corresponding dataset from datasets_list to _display_datasets
+        _display_datasets([datasets_list[dataset_index]])
+
+    except Exception as e:
+        print(f"[view_dataset]: {str(e)}")
+
+
+def delete_dataset(args) -> None:
+    """
+    Delete a dataset.
+
+    This function deletes a dataset with the specified name. It prompts the user for confirmation before proceeding
+    with the deletion. If the user confirms, it calls the api_delete_dataset function from the moonshot.api module to
+    delete the dataset. If the deletion is successful, it prints a confirmation message. If an exception occurs, it
+    prints an error message.
+
+    Args:
+        args: A namespace object from argparse. It should have the following attribute:
+            dataset (str): The name of the dataset to delete.
+
+    Returns:
+        None
+    """
+    # Confirm with the user before deleting a dataset
+    confirmation = console.input(
+        "[bold red]Are you sure you want to delete the dataset (y/N)? [/]"
+    )
+    if confirmation.lower() != "y":
+        console.print("[bold yellow]Dataset deletion cancelled.[/]")
+        return
+
+    try:
         if (
-
-            or not args.
-            or args.
-            or args.method.lower() not in ["hf", "csv"]
+            args.dataset is None
+            or not isinstance(args.dataset, str)
+            or not args.dataset
         ):
-            raise
+            raise ValueError(ERROR_BENCHMARK_DELETE_DATASET_DATASET_VALIDATION)
 
-
-
+        api_delete_dataset(args.dataset)
+        print("[delete_dataset]: Dataset deleted.")
+    except Exception as e:
+        print(f"[delete_dataset]: {str(e)}")
+
+def convert_dataset(args) -> None:
+    """
+    Convert an existing dataset to a new format.
 
-
+    Args:
+        args: A namespace object from argparse with the following attributes:
+            - name (str): Name of the new dataset.
+            - description (str): Description of the new dataset.
+            - reference (str): Reference of the new dataset.
+            - license (str): License of the new dataset.
+            - csv_file_path (str): Path to the existing dataset file.
+
+    Returns:
+        None
+    """
+    try:
+        new_dataset_id = api_convert_dataset(
+            args.name,
+            args.description,
+            args.reference,
+            args.license,
+            args.csv_file_path,
+        )
+        print(f"[convert_dataset]: Dataset ({new_dataset_id}) created.")
+    except Exception as e:
+        print(f"[convert_dataset]: {str(e)}")
+
+
+def download_dataset(args) -> None:
+    """
+    Download a dataset from Hugging Face.
+
+    Args:
+        args: A namespace object from argparse with the following attributes:
+            - name (str): Name of the new dataset.
+            - description (str): Description of the new dataset.
+            - reference (str): Reference of the new dataset.
+            - license (str): License of the new dataset.
+            - params (dict): Parameters for the dataset in dictionary format.
+
+    Returns:
+        None
+    """
+    try:
+        new_dataset_id = api_download_dataset(
             args.name,
             args.description,
             args.reference,
             args.license,
-            args.method,
             **args.params,
         )
-        print(f"[
+        print(f"[download_dataset]: Dataset ({new_dataset_id}) created.")
     except Exception as e:
-        print(f"[
+        print(f"[download_dataset]: {str(e)}")
+
+
+# ------------------------------------------------------------------------------
+# Helper functions: Display on cli
+# ------------------------------------------------------------------------------
+def _display_datasets(datasets_list: list):
+    """
+    Displays a list of datasets in a table format.
+
+    This function takes a list of datasets and displays them in a table format with each dataset's name, description,
+    and other relevant details. If the list is empty, it prints a message indicating that no datasets are found.
+
+    Args:
+        datasets_list (list): A list of dictionaries, where each dictionary contains the details of a dataset.
+
+    Returns:
+        None
+    """
+    table = Table(
+        title="List of Datasets", show_lines=True, expand=True, header_style="bold"
+    )
+    table.add_column("No.", width=2)
+    table.add_column("Dataset", justify="left", width=78)
+    for idx, dataset in enumerate(datasets_list, 1):
+        (
+            id,
+            name,
+            description,
+            _,
+            num_of_dataset_prompts,
+            created_date,
+            reference,
+            license,
+            *other_args,
+        ) = dataset.values()
+
+        idx = dataset.get("idx", idx)
+        prompt_info = display_view_str_format("Prompts", num_of_dataset_prompts)
+        created_date_info = display_view_str_format("Created Date", created_date)
+        license_info = display_view_str_format("License", license)
+        reference_info = display_view_str_format("Reference", reference)
+
+        dataset_info = (
+            f"[red]{id}[/red]\n\n[blue]{name}[/blue]\n{description}\n\n"
+            f"{prompt_info}\n\n{created_date_info}\n\n{license_info}\n\n{reference_info}"
+        )
+
+        table.add_section()
+        table.add_row(str(idx), dataset_info)
+    console.print(table)
 
 
 # ------------------------------------------------------------------------------
 # Cmd2 Arguments Parsers
 # ------------------------------------------------------------------------------
-#
-
-    description="
+# View dataset arguments
+view_dataset_args = cmd2.Cmd2ArgumentParser(
+    description="View a dataset file.",
+    epilog="Example:\n view_dataset bbq-lite-age-ambiguous",
+)
+view_dataset_args.add_argument(
+    "dataset_filename", type=str, help="Name of the dataset file"
+)
+
+# Delete dataset arguments
+delete_dataset_args = cmd2.Cmd2ArgumentParser(
+    description="Delete a dataset.",
+    epilog="Example:\n delete_dataset bbq-lite-age-ambiguous",
+)
+delete_dataset_args.add_argument("dataset", type=str, help="Name of the dataset")
+
+# List dataset arguments
+list_datasets_args = cmd2.Cmd2ArgumentParser(
+    description="List all datasets.",
+    epilog='Example:\n list_datasets -f "bbq"',
+)
+
+list_datasets_args.add_argument(
+    "-f",
+    "--find",
+    type=str,
+    help="Optional field to find dataset(s) with keyword",
+    nargs="?",
+)
+
+list_datasets_args.add_argument(
+    "-p",
+    "--pagination",
+    type=str,
+    help="Optional tuple to paginate dataset(s). E.g. (2,10) returns 2nd page with 10 items in each page.",
+    nargs="?",
+)
+
+# Convert dataset arguments
+convert_dataset_args = cmd2.Cmd2ArgumentParser(
+    description="Convert your dataset. The 'name' argument will be slugified to create a unique identifier.",
     epilog=(
         "Examples:\n"
-        "
-        "2. add_dataset 'dataset-name' 'A brief description' 'http://reference.com' 'MIT' 'hf' \"{'dataset_name': 'cais/mmlu', 'dataset_config': 'college_biology', 'split': 'test', 'input_col': ['question','choices'], 'target_col': 'answer'}\""  # noqa: E501
+        "convert_dataset 'dataset-name' 'A brief description' 'http://reference.com' 'MIT' '/path/to/your/file.csv'"
     ),
 )
-
-
+convert_dataset_args.add_argument("name", type=str, help="Name of the new dataset")
+convert_dataset_args.add_argument(
     "description", type=str, help="Description of the new dataset"
 )
-
+convert_dataset_args.add_argument(
     "reference", type=str, help="Reference of the new dataset"
 )
-
-
-
-
-
-
+convert_dataset_args.add_argument(
+    "license", type=str, help="License of the new dataset"
+)
+convert_dataset_args.add_argument(
+    "csv_file_path", type=str, help="Path to your existing dataset"
+)
+
+
+# Download dataset arguments
+download_dataset_args = cmd2.Cmd2ArgumentParser(
+    description="Download dataset from Hugging Face. The 'name' argument will be slugified to create a unique ID.",
+    epilog=(
+        "Examples:\n"
+        "download_dataset 'dataset-name' 'A brief description' 'http://reference.com' 'MIT' "
+        "\"{'dataset_name': 'cais/mmlu', 'dataset_config': 'college_biology', 'split': 'dev', "
+        "'input_col': ['question','choices'], 'target_col': 'answer'}\""
+    ),
+)
+download_dataset_args.add_argument("name", type=str, help="Name of the new dataset")
+download_dataset_args.add_argument(
+    "description", type=str, help="Description of the new dataset"
+)
+download_dataset_args.add_argument(
+    "reference", type=str, help="Reference of the new dataset"
+)
+download_dataset_args.add_argument(
+    "license", type=str, help="License of the new dataset"
 )
-
+download_dataset_args.add_argument(
     "params",
    type=literal_eval,
     help=(
         "Params of the new dataset in dictionary format. For example: \n"
         "1. For 'csv' method: \"{'csv_file_path': '/path/to/your/file.csv'}\"\n"
-        "2. For 'hf' method: \"{'dataset_name': 'cais_mmlu', 'dataset_config': 'college_biology', 'split': 'test',
+        "2. For 'hf' method: \"{'dataset_name': 'cais_mmlu', 'dataset_config': 'college_biology', 'split': 'test', "
+        "'input_col': ['questions','choices'], 'target_col': 'answer'}\""
     ),
 )
```
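The heart of the new `list_datasets` flow is the `--pagination` check: the flag arrives as a string, is parsed with `ast.literal_eval`, and is accepted only if it evaluates to a tuple of exactly two ints. Below is a minimal standalone sketch of that pattern; the error message is a placeholder for the `ERROR_BENCHMARK_LIST_DATASETS_PAGINATION_VALIDATION_1` constant used in the diff.

```python
from ast import literal_eval


def parse_pagination(raw: str) -> tuple[int, int]:
    """Mirror of the CLI's pagination check: accept only a 2-tuple of ints."""
    try:
        pagination = literal_eval(raw)  # parses Python literals only
        if not (
            isinstance(pagination, tuple)
            and len(pagination) == 2
            and all(isinstance(i, int) for i in pagination)
        ):
            raise ValueError("pagination must be a tuple of two integers, e.g. (2,10)")
    except (ValueError, SyntaxError):
        raise ValueError("pagination must be a tuple of two integers, e.g. (2,10)")
    return pagination


print(parse_pagination("(2,10)"))  # -> (2, 10): page 2, 10 items per page
# parse_pagination("[2,10]") and parse_pagination("(2,'a')") both raise ValueError
```

Using `literal_eval` rather than `eval` restricts the parse to Python literals, so an arbitrary expression passed through the flag can never execute code.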
moonshot/integrations/cli/redteam/attack_module.py:

```diff
@@ -5,6 +5,11 @@ from rich.console import Console
 from rich.table import Table
 
 from moonshot.api import api_delete_attack_module, api_get_all_attack_module_metadata
+from moonshot.integrations.cli.cli_errors import (
+    ERROR_RED_TEAMING_LIST_ATTACK_MODULES_FIND_VALIDATION,
+    ERROR_RED_TEAMING_LIST_ATTACK_MODULES_PAGINATION_VALIDATION,
+    ERROR_RED_TEAMING_LIST_ATTACK_MODULES_PAGINATION_VALIDATION_1,
+)
 from moonshot.integrations.cli.utils.process_data import filter_data
 
 console = Console()
@@ -28,6 +33,31 @@ def list_attack_modules(args) -> list | None:
     try:
         print("Listing attack modules may take a while...")
         attack_module_metadata_list = api_get_all_attack_module_metadata()
+
+        if args.find is not None:
+            if not isinstance(args.find, str) or not args.find:
+                raise TypeError(ERROR_RED_TEAMING_LIST_ATTACK_MODULES_FIND_VALIDATION)
+
+        if args.pagination is not None:
+            if not isinstance(args.pagination, str) or not args.pagination:
+                raise TypeError(
+                    ERROR_RED_TEAMING_LIST_ATTACK_MODULES_PAGINATION_VALIDATION
+                )
+            try:
+                pagination = literal_eval(args.pagination)
+                if not (
+                    isinstance(pagination, tuple)
+                    and len(pagination) == 2
+                    and all(isinstance(i, int) for i in pagination)
+                ):
+                    raise ValueError(
+                        ERROR_RED_TEAMING_LIST_ATTACK_MODULES_PAGINATION_VALIDATION_1
+                    )
+            except (ValueError, SyntaxError):
+                raise ValueError(
+                    ERROR_RED_TEAMING_LIST_ATTACK_MODULES_PAGINATION_VALIDATION_1
+                )
+
         keyword = args.find.lower() if args.find else ""
         pagination = literal_eval(args.pagination) if args.pagination else ()
 
@@ -41,7 +71,6 @@ def list_attack_modules(args) -> list | None:
 
         console.print("[red]There are no attack modules found.[/red]")
         return None
-
     except Exception as e:
         print(f"[list_attack_modules]: {str(e)}")
 
```
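The same find/pagination validation now guards `list_attack_modules`. A quick sketch of driving the handler directly with an `argparse.Namespace`, assuming moonshot is installed and its attack-module environment is configured; "charswap" is only an illustrative filter keyword.

```python
from argparse import Namespace

from moonshot.integrations.cli.redteam.attack_module import list_attack_modules

# Valid flags: returns the filtered metadata list (or None if nothing matches).
modules = list_attack_modules(Namespace(find="charswap", pagination="(1,5)"))

# Invalid pagination: reported as "[list_attack_modules]: ..." rather than a
# crash, since validation happens inside the handler's try/except.
list_attack_modules(Namespace(find=None, pagination="(1,'a')"))
```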
moonshot/integrations/web_api/app.py:

```diff
@@ -71,7 +71,7 @@ def create_app(cfg: providers.Configuration) -> CustomFastAPI:
     }
 
     app: CustomFastAPI = CustomFastAPI(
-        title="Project Moonshot", version="0.4.7", **app_kwargs
+        title="Project Moonshot", version="0.4.9", **app_kwargs
     )
 
     if cfg.cors.enabled():
```
moonshot/integrations/web_api/routes/dataset.py:

```diff
@@ -1,8 +1,8 @@
 from dependency_injector.wiring import Provide, inject
-from fastapi import APIRouter, Depends, HTTPException, Query
+from fastapi import APIRouter, Depends, HTTPException
 
 from ..container import Container
-from ..schemas.dataset_create_dto import
+from ..schemas.dataset_create_dto import CSV_Dataset_DTO, HF_Dataset_DTO
 from ..schemas.dataset_response_dto import DatasetResponseDTO
 from ..services.dataset_service import DatasetService
 from ..services.utils.exceptions_handler import ServiceException
@@ -10,27 +10,22 @@ from ..services.utils.exceptions_handler import ServiceException
 router = APIRouter(tags=["Datasets"])
 
 
-@router.post("/api/v1/datasets")
+@router.post("/api/v1/datasets/csv")
 @inject
-def
-    dataset_data:
-    method: str = Query(
-        ...,
-        description="The method to use for creating the dataset. Supported methods are 'hf' and 'csv'.",
-    ),
+def convert_dataset(
+    dataset_data: CSV_Dataset_DTO,
     dataset_service: DatasetService = Depends(Provide[Container.dataset_service]),
 ) -> str:
     """
-
+    Convert a CSV dataset to the desired format.
 
     Args:
-        dataset_data (
-
-        dataset_service (DatasetService, optional): The service responsible for creating the dataset.
+        dataset_data (CSV_Dataset_DTO): The data required to convert the dataset.
+        dataset_service (DatasetService, optional): The service responsible for converting the dataset.
             Defaults to Depends(Provide[Container.dataset_service]).
 
     Returns:
-
+        str: The path to the newly created dataset.
 
     Raises:
         HTTPException: An error with status code 404 if the dataset file is not found.
@@ -38,19 +33,58 @@ def create_dataset(
         An error with status code 500 for any other server-side error.
     """
     try:
-        return dataset_service.
+        return dataset_service.convert_dataset(dataset_data)
     except ServiceException as e:
         if e.error_code == "FileNotFound":
             raise HTTPException(
-                status_code=404, detail=f"Failed to
+                status_code=404, detail=f"Failed to convert dataset: {e.msg}"
             )
         elif e.error_code == "ValidationError":
             raise HTTPException(
-                status_code=400, detail=f"Failed to
+                status_code=400, detail=f"Failed to convert dataset: {e.msg}"
             )
         else:
             raise HTTPException(
-                status_code=500, detail=f"Failed to
+                status_code=500, detail=f"Failed to convert dataset: {e.msg}"
+            )
+
+
+@router.post("/api/v1/datasets/hf")
+@inject
+def download_dataset(
+    dataset_data: HF_Dataset_DTO,
+    dataset_service: DatasetService = Depends(Provide[Container.dataset_service]),
+) -> str:
+    """
+    Download a dataset from Hugging Face using the provided dataset data.
+
+    Args:
+        dataset_data (HF_Dataset_DTO): The data required to download the dataset.
+        dataset_service (DatasetService, optional): The service responsible for downloading the dataset.
+            Defaults to Depends(Provide[Container.dataset_service]).
+
+    Returns:
+        str: The path to the newly downloaded dataset.
+
+    Raises:
+        HTTPException: An error with status code 404 if the dataset file is not found.
+            An error with status code 400 if there is a validation error.
+            An error with status code 500 for any other server-side error.
+    """
+    try:
+        return dataset_service.download_dataset(dataset_data)
+    except ServiceException as e:
+        if e.error_code == "FileNotFound":
+            raise HTTPException(
+                status_code=404, detail=f"Failed to download dataset: {e.msg}"
+            )
+        elif e.error_code == "ValidationError":
+            raise HTTPException(
+                status_code=400, detail=f"Failed to download dataset: {e.msg}"
+            )
+        else:
+            raise HTTPException(
+                status_code=500, detail=f"Failed to download dataset: {e.msg}"
             )
 
 
```
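The single `POST /api/v1/datasets` route with its `method` query parameter is thus split into two typed routes, `/api/v1/datasets/csv` and `/api/v1/datasets/hf`, each bound to its own DTO. A sketch of calling them with `requests`; the base URL and the field values are assumptions for illustration only.

```python
import requests

BASE_URL = "http://127.0.0.1:5000"  # assumed address of the moonshot web API

# Convert a local CSV file into a dataset (previously POST /api/v1/datasets?method=csv).
resp = requests.post(
    f"{BASE_URL}/api/v1/datasets/csv",
    json={
        "name": "my-dataset",
        "description": "A brief description",
        "reference": "http://reference.com",
        "license": "MIT",
        "csv_file_path": "/path/to/your/file.csv",
    },
)
print(resp.status_code, resp.text)  # on success, the path of the new dataset

# Download a dataset from Hugging Face (previously POST /api/v1/datasets?method=hf).
resp = requests.post(
    f"{BASE_URL}/api/v1/datasets/hf",
    json={
        "name": "mmlu-college-biology",
        "description": "MMLU college biology split",
        "params": {
            "dataset_name": "cais/mmlu",
            "dataset_config": "college_biology",
            "split": "test",
            "input_col": ["question", "choices"],
            "target_col": "answer",
        },
    },
)
print(resp.status_code, resp.text)
```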
moonshot/integrations/web_api/schemas/dataset_create_dto.py:

```diff
@@ -8,11 +8,21 @@ from moonshot.src.datasets.dataset_arguments import (
 )
 
 
-class
-    id: Optional[str] = None
-    examples: Iterator[dict] = None
+class CSV_Dataset_DTO(DatasetPydanticModel):
+    id: Optional[str] = None  # Not a required from user
+    examples: Optional[Iterator[dict]] = None  # Not a required from user
     name: str = Field(..., min_length=1)
     description: str = Field(default="", min_length=1)
     license: Optional[str] = ""
     reference: Optional[str] = ""
-
+    csv_file_path: str = Field(..., min_length=1)
+
+
+class HF_Dataset_DTO(DatasetPydanticModel):
+    id: Optional[str] = None  # Not a required from user
+    examples: Optional[Iterator[dict]] = None  # Not a required from user
+    name: str = Field(..., min_length=1)
+    description: str = Field(default="", min_length=1)
+    license: Optional[str] = ""
+    reference: Optional[str] = ""
+    params: dict = Field(..., min_length=1)
```