PyPI - rapidata - Versions diffs - 2.21.5__py3-none-any.whl → 2.23.0__py3-none-any.whl - Mend

rapidata 2.21.5__py3-none-any.whl → 2.23.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of rapidata might be problematic. Click here for more details.

Files changed (60) hide show

rapidata/__init__.py +5 -0
rapidata/api_client/__init__.py +8 -4
rapidata/api_client/api/__init__.py +1 -0
rapidata/api_client/api/evaluation_workflow_api.py +372 -0
rapidata/api_client/api/identity_api.py +268 -0
rapidata/api_client/api/rapid_api.py +353 -1987
rapidata/api_client/api/simple_workflow_api.py +6 -6
rapidata/api_client/models/__init__.py +7 -4
rapidata/api_client/models/add_campaign_model.py +25 -1
rapidata/api_client/models/add_validation_rapid_model_truth.py +24 -10
rapidata/api_client/models/compare_result.py +2 -0
rapidata/api_client/models/create_order_model.py +43 -2
rapidata/api_client/models/evaluation_workflow_model1.py +115 -0
rapidata/api_client/models/filter.py +2 -2
rapidata/api_client/models/get_validation_rapids_result.py +11 -4
rapidata/api_client/models/get_validation_rapids_result_truth.py +24 -10
rapidata/api_client/models/get_workflow_by_id_result_workflow.py +23 -9
rapidata/api_client/models/get_workflow_results_result.py +118 -0
rapidata/api_client/models/get_workflow_results_result_paged_result.py +105 -0
rapidata/api_client/models/google_one_tap_login_model.py +87 -0
rapidata/api_client/models/labeling_selection.py +22 -3
rapidata/api_client/models/logic_operator.py +1 -0
rapidata/api_client/models/rapid_response.py +3 -1
rapidata/api_client/models/retrieval_mode.py +38 -0
rapidata/api_client/models/root_filter.py +2 -2
rapidata/api_client/models/skip_truth.py +94 -0
rapidata/api_client/models/sticky_state.py +38 -0
rapidata/api_client/models/update_validation_rapid_model.py +11 -4
rapidata/api_client/models/update_validation_rapid_model_truth.py +24 -10
rapidata/api_client/rest.py +1 -0
rapidata/api_client_README.md +10 -11
rapidata/rapidata_client/__init__.py +7 -0
rapidata/rapidata_client/api/rapidata_exception.py +5 -3
rapidata/rapidata_client/assets/_media_asset.py +8 -1
rapidata/rapidata_client/assets/_multi_asset.py +6 -0
rapidata/rapidata_client/assets/_text_asset.py +6 -0
rapidata/rapidata_client/demographic/demographic_manager.py +2 -3
rapidata/rapidata_client/logging/__init__.py +2 -0
rapidata/rapidata_client/logging/logger.py +47 -0
rapidata/rapidata_client/logging/output_manager.py +16 -0
rapidata/rapidata_client/order/_rapidata_dataset.py +48 -33
rapidata/rapidata_client/order/_rapidata_order_builder.py +41 -19
rapidata/rapidata_client/order/rapidata_order.py +22 -13
rapidata/rapidata_client/order/rapidata_order_manager.py +84 -34
rapidata/rapidata_client/order/rapidata_results.py +2 -1
rapidata/rapidata_client/rapidata_client.py +6 -1
rapidata/rapidata_client/selection/__init__.py +1 -0
rapidata/rapidata_client/selection/labeling_selection.py +8 -2
rapidata/rapidata_client/selection/retrieval_modes.py +9 -0
rapidata/rapidata_client/settings/alert_on_fast_response.py +2 -1
rapidata/rapidata_client/settings/free_text_minimum_characters.py +2 -1
rapidata/rapidata_client/validation/rapidata_validation_set.py +2 -2
rapidata/rapidata_client/validation/rapids/rapids.py +3 -1
rapidata/rapidata_client/validation/validation_set_manager.py +39 -36
rapidata/service/credential_manager.py +22 -30
rapidata/service/openapi_service.py +11 -0
{rapidata-2.21.5.dist-info → rapidata-2.23.0.dist-info}/METADATA +2 -1
{rapidata-2.21.5.dist-info → rapidata-2.23.0.dist-info}/RECORD +60 -48
{rapidata-2.21.5.dist-info → rapidata-2.23.0.dist-info}/WHEEL +1 -1
{rapidata-2.21.5.dist-info → rapidata-2.23.0.dist-info}/LICENSE +0 -0

rapidata/rapidata_client/order/rapidata_order_manager.py CHANGED Viewed

@@ -5,7 +5,7 @@ from rapidata.service.openapi_service import OpenAPIService
 from rapidata.rapidata_client.assets.data_type_enum import RapidataDataTypes
 from rapidata.rapidata_client.order.rapidata_order import RapidataOrder
 from rapidata.rapidata_client.order._rapidata_order_builder import RapidataOrderBuilder
-from rapidata.rapidata_client.metadata import PromptMetadata, SelectWordsMetadata
+from rapidata.rapidata_client.metadata import PromptMetadata, SelectWordsMetadata, PrivateTextMetadata, Metadata
 from rapidata.rapidata_client.referee._naive_referee import NaiveReferee
 from rapidata.rapidata_client.referee._early_stopping_referee import EarlyStoppingReferee
 from rapidata.rapidata_client.selection._base_selection import RapidataSelection
@@ -34,6 +34,7 @@ from rapidata.api_client.models.page_info import PageInfo
 from rapidata.api_client.models.root_filter import RootFilter
 from rapidata.api_client.models.filter import Filter
 from rapidata.api_client.models.sort_criterion import SortCriterion
+from rapidata.rapidata_client.logging import logger
 from tqdm import tqdm
@@ -53,6 +54,7 @@ class RapidataOrderManager:
         self.settings = RapidataSettings
         self.selections = RapidataSelections
         self.__priority = 50
+        logger.debug("RapidataOrderManager initialized")
     def __get_selections(self, validation_set_id: str | None, labeling_amount=3) -> Sequence[RapidataSelection]:
         if validation_set_id:
@@ -71,7 +73,8 @@ class RapidataOrderManager:
             filters: Sequence[RapidataFilter] = [],
             settings: Sequence[RapidataSetting] = [],
             sentences: list[str] | None = None,
-            selections: Sequence[RapidataSelection] | None = None,
+            selections: Sequence[RapidataSelection] = [],
+            private_notes: list[str] | None = None,
             default_labeling_amount: int = 3
         ) -> RapidataOrder:
@@ -80,12 +83,12 @@ class RapidataOrderManager:
         if sentences and len(sentences) != len(assets):
             raise ValueError("Number of sentences must match number of datapoints")
+        if private_notes and len(private_notes) != len(assets):
+            raise ValueError("Number of private notes must match number of datapoints")
         if sentences and contexts:
             raise ValueError("You can only use contexts or sentences, not both")
-        if contexts and data_type == RapidataDataTypes.TEXT:
-            print("Warning: Contexts are not supported for text data type. Ignoring contexts.")
         if not confidence_threshold:
             referee = NaiveReferee(responses=responses_per_datapoint)
@@ -98,21 +101,32 @@ class RapidataOrderManager:
         order_builder = RapidataOrderBuilder(name=name, openapi_service=self._openapi_service)
         if selections and validation_set_id:
-            print("Warning: You provided both selections and validation_set_id. Ignoring validation_set_id.")
+            logger.warning("Warning: Both selections and validation_set_id provided. Ignoring validation_set_id.")
-        if selections is None:
+        if not selections:
             selections = self.__get_selections(validation_set_id, labeling_amount=default_labeling_amount)
         prompts_metadata = [PromptMetadata(prompt=prompt) for prompt in contexts] if contexts else None
         sentence_metadata = [SelectWordsMetadata(select_words=sentence) for sentence in sentences] if sentences else None
-        metadata = prompts_metadata or sentence_metadata or None
+        if prompts_metadata and sentence_metadata:
+            raise ValueError("You can only use contexts or sentences, not both")
+        metadata_list: Sequence[Metadata] = prompts_metadata or sentence_metadata or []
+        private_notes_metadata_list: Sequence[Metadata] = [PrivateTextMetadata(text=text) for text in private_notes] if private_notes else []
+        multi_metadata: Sequence[Sequence[Metadata]] = (
+            [[metadata, private_notes_metadata] for metadata, private_notes_metadata in zip(metadata_list, private_notes_metadata_list, strict=True)] if metadata_list and private_notes
+            else [[private_notes_metadata] for private_notes_metadata in private_notes_metadata_list] if private_notes
+            else [[metadata] for metadata in metadata_list] if metadata_list
+            else []
+        )
         order = (order_builder
                  ._workflow(workflow)
                  ._media(
-                     asset=assets,
-                     metadata=metadata
+                     assets=assets,
+                     multi_metadata=multi_metadata
                      )
                  ._referee(referee)
                  ._filters(filters)
@@ -138,7 +152,8 @@ class RapidataOrderManager:
             confidence_threshold: float | None = None,
             filters: Sequence[RapidataFilter] = [],
             settings: Sequence[RapidataSetting] = [],
-            selections: Sequence[RapidataSelection] | None = None,
+            selections: Sequence[RapidataSelection] = [],
+            private_notes: list[str] | None = None,
         ) -> RapidataOrder:
         """Create a classification order.
@@ -159,7 +174,10 @@ class RapidataOrderManager:
                 If provided, the classification datapoint will stop after the threshold is reached or at the number of responses, whatever happens first.
             filters (Sequence[RapidataFilter], optional): The list of filters for the classification. Defaults to []. Decides who the tasks should be shown to.
             settings (Sequence[RapidataSetting], optional): The list of settings for the classification. Defaults to []. Decides how the tasks should be shown.
-            selections (Sequence[RapidataSelection], optional): The list of selections for the classification. Defaults to None. Decides in what order the tasks should be shown.
+            selections (Sequence[RapidataSelection], optional): The list of selections for the classification. Defaults to []. Decides in what order the tasks should be shown.
+            private_notes (list[str], optional): The list of private notes for the classification. Defaults to None.
+                If provided has to be the same length as datapoints.\n
+                This will NOT be shown to the labelers but will be included in the result purely for your own reference.
         """
         if data_type == RapidataDataTypes.MEDIA:
@@ -183,7 +201,8 @@ class RapidataOrderManager:
             confidence_threshold=confidence_threshold,
             filters=filters,
             selections=selections,
-            settings=settings
+            settings=settings,
+            private_notes=private_notes
         )
     def create_compare_order(self,
@@ -197,7 +216,8 @@ class RapidataOrderManager:
             confidence_threshold: float | None = None,
             filters: Sequence[RapidataFilter] = [],
             settings: Sequence[RapidataSetting] = [],
-            selections: Sequence[RapidataSelection] | None = None,
+            selections: Sequence[RapidataSelection] = [],
+            private_notes: list[str] | None = None,
         ) -> RapidataOrder:
         """Create a compare order.
@@ -217,7 +237,10 @@ class RapidataOrderManager:
                 If provided, the comparison datapoint will stop after the threshold is reached or at the number of responses, whatever happens first.
             filters (Sequence[RapidataFilter], optional): The list of filters for the comparison. Defaults to []. Decides who the tasks should be shown to.
             settings (Sequence[RapidataSetting], optional): The list of settings for the comparison. Defaults to []. Decides how the tasks should be shown.
-            selections (Sequence[RapidataSelection], optional): The list of selections for the comparison. Defaults to None. Decides in what order the tasks should be shown.
+            selections (Sequence[RapidataSelection], optional): The list of selections for the comparison. Defaults to []. Decides in what order the tasks should be shown.
+            private_notes (list[str], optional): The list of private notes for the comparison. Defaults to None.\n
+                If provided has to be the same length as datapoints.\n
+                This will NOT be shown to the labelers but will be included in the result purely for your own reference.
         """
         if data_type == RapidataDataTypes.MEDIA:
@@ -240,7 +263,8 @@ class RapidataOrderManager:
             confidence_threshold=confidence_threshold,
             filters=filters,
             selections=selections,
-            settings=settings
+            settings=settings,
+            private_notes=private_notes
         )
     def create_ranking_order(self,
@@ -255,7 +279,7 @@ class RapidataOrderManager:
                              validation_set_id: Optional[str] = None,
                              filters: Sequence[RapidataFilter] = [],
                              settings: Sequence[RapidataSetting] = [],
-                             selections: Optional[Sequence[RapidataSelection]] = None
+                             selections: Sequence[RapidataSelection] = []
                              ) -> RapidataOrder:
         """
         Create a ranking order.
@@ -276,7 +300,7 @@ class RapidataOrderManager:
                 If provided, one validation task will be shown infront of the datapoints that will be labeled.
             filters (Sequence[RapidataFilter], optional): The list of filters for the order. Defaults to []. Decides who the tasks should be shown to.
             settings (Sequence[RapidataSetting], optional): The list of settings for the order. Defaults to []. Decides how the tasks should be shown.
-            selections (Sequence[RapidataSelection], optional): The list of selections for the order. Defaults to None. Decides in what order the tasks should be shown.
+            selections (Sequence[RapidataSelection], optional): The list of selections for the order. Defaults to []. Decides in what order the tasks should be shown.
         """
         if data_type == RapidataDataTypes.MEDIA:
@@ -299,7 +323,7 @@ class RapidataOrderManager:
             validation_set_id=validation_set_id,
             filters=filters,
             selections=selections,
-            settings=settings
+            settings=settings,
         )
     def create_free_text_order(self,
@@ -310,7 +334,8 @@ class RapidataOrderManager:
             responses_per_datapoint: int = 10,
             filters: Sequence[RapidataFilter] = [],
             settings: Sequence[RapidataSetting] = [],
-            selections: Sequence[RapidataSelection] | None = None,
+            selections: Sequence[RapidataSelection] = [],
+            private_notes: list[str] | None = None,
         ) -> RapidataOrder:
         """Create a free text order.
@@ -323,7 +348,10 @@ class RapidataOrderManager:
             responses_per_datapoint (int, optional): The number of responses that will be collected per datapoint. Defaults to 10.
             filters (Sequence[RapidataFilter], optional): The list of filters for the free text. Defaults to []. Decides who the tasks should be shown to.
             settings (Sequence[RapidataSetting], optional): The list of settings for the free text. Defaults to []. Decides how the tasks should be shown.
-            selections (Sequence[RapidataSelection], optional): The list of selections for the free text. Defaults to None. Decides in what order the tasks should be shown.
+            selections (Sequence[RapidataSelection], optional): The list of selections for the free text. Defaults to []. Decides in what order the tasks should be shown.
+            private_notes (list[str], optional): The list of private notes for the free text. Defaults to None.\n
+                If provided has to be the same length as datapoints.\n
+                This will NOT be shown to the labelers but will be included in the result purely for your own reference.
         """
         if data_type == RapidataDataTypes.MEDIA:
@@ -344,7 +372,8 @@ class RapidataOrderManager:
             filters=filters,
             selections=selections,
             settings=settings,
-            default_labeling_amount=1
+            default_labeling_amount=1,
+            private_notes=private_notes
         )
     def create_select_words_order(self,
@@ -356,7 +385,8 @@ class RapidataOrderManager:
             validation_set_id: str | None = None,
             filters: Sequence[RapidataFilter] = [],
             settings: Sequence[RapidataSetting] = [],
-            selections: Sequence[RapidataSelection] | None = None,
+            selections: Sequence[RapidataSelection] = [],
+            private_notes: list[str] | None = None,
         ) -> RapidataOrder:
         """Create a select words order.
@@ -371,7 +401,10 @@ class RapidataOrderManager:
                 If provided, one validation task will be shown infront of the datapoints that will be labeled.
             filters (Sequence[RapidataFilter], optional): The list of filters for the select words. Defaults to []. Decides who the tasks should be shown to.
             settings (Sequence[RapidataSetting], optional): The list of settings for the select words. Defaults to []. Decides how the tasks should be shown.
-            selections (Sequence[RapidataSelection], optional): The list of selections for the select words. Defaults to None. Decides in what order the tasks should be shown.
+            selections (Sequence[RapidataSelection], optional): The list of selections for the select words. Defaults to []. Decides in what order the tasks should be shown.
+            private_notes (list[str], optional): The list of private notes for the select words. Defaults to None.\n
+                If provided has to be the same length as datapoints.\n
+                This will NOT be shown to the labelers but will be included in the result purely for your own reference.
         """
         assets = [MediaAsset(path=path) for path in datapoints]
@@ -388,7 +421,8 @@ class RapidataOrderManager:
             selections=selections,
             settings=settings,
             sentences=sentences,
-            default_labeling_amount=2
+            default_labeling_amount=2,
+            private_notes=private_notes
         )
     def create_locate_order(self,
@@ -400,7 +434,8 @@ class RapidataOrderManager:
             validation_set_id: str | None = None,
             filters: Sequence[RapidataFilter] = [],
             settings: Sequence[RapidataSetting] = [],
-            selections: Sequence[RapidataSelection] | None = None,
+            selections: Sequence[RapidataSelection] = [],
+            private_notes: list[str] | None = None,
         ) -> RapidataOrder:
         """Create a locate order.
@@ -416,7 +451,10 @@ class RapidataOrderManager:
                 If provided, one validation task will be shown infront of the datapoints that will be labeled.
             filters (Sequence[RapidataFilter], optional): The list of filters for the locate. Defaults to []. Decides who the tasks should be shown to.
             settings (Sequence[RapidataSetting], optional): The list of settings for the locate. Defaults to []. Decides how the tasks should be shown.
-            selections (Sequence[RapidataSelection], optional): The list of selections for the locate. Defaults to None. Decides in what order the tasks should be shown.
+            selections (Sequence[RapidataSelection], optional): The list of selections for the locate. Defaults to []. Decides in what order the tasks should be shown.
+            private_notes (list[str], optional): The list of private notes for the locate. Defaults to None.\n
+                If provided has to be the same length as datapoints.\n
+                This will NOT be shown to the labelers but will be included in the result purely for your own reference.
         """
         assets = [MediaAsset(path=path) for path in datapoints]
@@ -430,7 +468,8 @@ class RapidataOrderManager:
             validation_set_id=validation_set_id,
             filters=filters,
             selections=selections,
-            settings=settings
+            settings=settings,
+            private_notes=private_notes
         )
     def create_draw_order(self,
@@ -442,7 +481,8 @@ class RapidataOrderManager:
             validation_set_id: str | None = None,
             filters: Sequence[RapidataFilter] = [],
             settings: Sequence[RapidataSetting] = [],
-            selections: Sequence[RapidataSelection] | None = None,
+            selections: Sequence[RapidataSelection] = [],
+            private_notes: list[str] | None = None,
         ) -> RapidataOrder:
         """Create a draw order.
@@ -458,7 +498,10 @@ class RapidataOrderManager:
                 If provided, one validation task will be shown infront of the datapoints that will be labeled.
             filters (Sequence[RapidataFilter], optional): The list of filters for the draw lines. Defaults to []. Decides who the tasks should be shown to.
             settings (Sequence[RapidataSetting], optional): The list of settings for the draw lines. Defaults to []. Decides how the tasks should be shown.
-            selections (Sequence[RapidataSelection], optional): The list of selections for the draw lines. Defaults to None. Decides in what order the tasks should be shown.
+            selections (Sequence[RapidataSelection], optional): The list of selections for the draw lines. Defaults to []. Decides in what order the tasks should be shown.
+            private_notes (list[str], optional): The list of private notes for the draw lines. Defaults to None.\n
+                If provided has to be the same length as datapoints.\n
+                This will NOT be shown to the labelers but will be included in the result purely for your own reference.
         """
         assets = [MediaAsset(path=path) for path in datapoints]
@@ -472,7 +515,8 @@ class RapidataOrderManager:
             validation_set_id=validation_set_id,
             filters=filters,
             selections=selections,
-            settings=settings
+            settings=settings,
+            private_notes=private_notes
         )
     def create_timestamp_order(self,
@@ -484,7 +528,8 @@ class RapidataOrderManager:
             validation_set_id: str | None = None,
             filters: Sequence[RapidataFilter] = [],
             settings: Sequence[RapidataSetting] = [],
-            selections: Sequence[RapidataSelection] | None = None,
+            selections: Sequence[RapidataSelection] = [],
+            private_notes: list[str] | None = None,
         ) -> RapidataOrder:
         """Create a timestamp order.
@@ -497,9 +542,13 @@ class RapidataOrderManager:
                 If provided has to be the same length as datapoints and will be shown in addition to the instruction. (Therefore will be different for each datapoint)
                 Will be match up with the datapoints using the list index.
             validation_set_id (str, optional): The ID of the validation set. Defaults to None.\n
+                If provided, one validation task will be shown infront of the datapoints that will be labeled.
             filters (Sequence[RapidataFilter], optional): The list of filters for the timestamp. Defaults to []. Decides who the tasks should be shown to.
             settings (Sequence[RapidataSetting], optional): The list of settings for the timestamp. Defaults to []. Decides how the tasks should be shown.
-            selections (Sequence[RapidataSelection], optional): The list of selections for the timestamp. Defaults to None. Decides in what order the tasks should be shown.
+            selections (Sequence[RapidataSelection], optional): The list of selections for the timestamp. Defaults to []. Decides in what order the tasks should be shown.
+            private_notes (list[str], optional): The list of private notes for the timestamp. Defaults to None.\n
+                If provided has to be the same length as datapoints.\n
+                This will NOT be shown to the labelers but will be included in the result purely for your own reference.
         """
         assets = [MediaAsset(path=path) for path in datapoints]
@@ -520,7 +569,8 @@ class RapidataOrderManager:
             filters=filters,
             selections=selections,
             settings=settings,
-            default_labeling_amount=2
+            default_labeling_amount=2,
+            private_notes=private_notes
         )
     def get_order_by_id(self, order_id: str) -> RapidataOrder:

rapidata/rapidata_client/order/rapidata_results.py CHANGED Viewed

@@ -2,6 +2,7 @@ import pandas as pd
 from typing import Any
 from pandas.core.indexes.base import Index
 import json
+from rapidata.rapidata_client.logging import managed_print
 class RapidataResults(dict):
     """
@@ -32,7 +33,7 @@ class RapidataResults(dict):
             return pd.DataFrame()
         if self["info"].get("orderType") is None:
-            print("Warning: Results are old and Order type is not specified. Dataframe might be wrong.")
+            managed_print("Warning: Results are old and Order type is not specified. Dataframe might be wrong.")
         # Check for detailed results if split_details is True
         if split_details:

rapidata/rapidata_client/rapidata_client.py CHANGED Viewed

@@ -8,6 +8,7 @@ from rapidata.rapidata_client.validation.validation_set_manager import (
 from rapidata.rapidata_client.demographic.demographic_manager import DemographicManager
+from rapidata.rapidata_client.logging import logger
 class RapidataClient:
     """The Rapidata client is the main entry point for interacting with the Rapidata API. It allows you to create orders and validation sets."""
@@ -38,6 +39,7 @@ class RapidataClient:
             order (RapidataOrderManager): The RapidataOrderManager instance.
             validation (ValidationSetManager): The ValidationSetManager instance.
         """
+        logger.debug("Initializing OpenAPIService")
         self._openapi_service = OpenAPIService(
             client_id=client_id,
             client_secret=client_secret,
@@ -48,12 +50,15 @@ class RapidataClient:
             leeway=leeway,
         )
+        logger.debug("Initializing RapidataOrderManager")
         self.order = RapidataOrderManager(openapi_service=self._openapi_service)
+        logger.debug("Initializing ValidationSetManager")
         self.validation = ValidationSetManager(openapi_service=self._openapi_service)
+        logger.debug("Initializing DemographicManager")
         self._demographic = DemographicManager(openapi_service=self._openapi_service)
     def reset_credentials(self):
         """Reset the credentials saved in the configuration file for the current environment."""
         self._openapi_service.reset_credentials()

rapidata/rapidata_client/selection/__init__.py CHANGED Viewed

@@ -7,3 +7,4 @@ from .capped_selection import CappedSelection
 from .shuffling_selection import ShufflingSelection
 from .ab_test_selection import AbTestSelection
 from .static_selection import StaticSelection
+from .retrieval_modes import RetrievalMode

rapidata/rapidata_client/selection/labeling_selection.py CHANGED Viewed

@@ -1,5 +1,6 @@
 from typing import Any
 from rapidata.rapidata_client.selection._base_selection import RapidataSelection
+from rapidata.rapidata_client.selection.retrieval_modes import RetrievalMode
 from rapidata.api_client.models.labeling_selection import (
     LabelingSelection as LabelingSelectionModel,
 )
@@ -12,10 +13,15 @@ class LabelingSelection(RapidataSelection):
     Args:
         amount (int): The amount of labeling rapids that will be shown per session.
+        retrieval_mode (RetrievalMode): The retrieval mode to use. Defaults to "Random".
+        max_iterations (int | None): The maximum number an annotator can see the same task. Defaults to None.
+            This parameter is only taken into account when using "Shuffled" or "Sequential" retrieval modes.
     """
-    def __init__(self, amount: int):
+    def __init__(self, amount: int, retrieval_mode: RetrievalMode = RetrievalMode.Random, max_iterations: int | None = None):
         self.amount = amount
+        self.retrieval_mode = retrieval_mode
+        self.max_iterations = max_iterations
     def _to_model(self) -> Any:
-        return LabelingSelectionModel(_t="LabelingSelection", amount=self.amount)
+        return LabelingSelectionModel(_t="LabelingSelection", amount=self.amount, retrievalMode=self.retrieval_mode.value, maxIterations=self.max_iterations)

rapidata/rapidata_client/selection/retrieval_modes.py ADDED Viewed

@@ -0,0 +1,9 @@
+from enum import Enum
+class RetrievalMode(Enum):
+    # Will just randomly shuffle the datapoints. This is the default and will NOT take into account the "max_iterations" parameter.
+    Random = "Random"
+    # Will shuffle the datapoints randomly for each user. The user will then see the datapoints in that order. This will take into account the "max_iterations" parameter.
+    Shuffled = "Shuffled"
+    # Will show the datapoints in the order they are in the dataset. This will take into account the "max_iterations" parameter.
+    Sequential = "Sequential"

rapidata/rapidata_client/settings/alert_on_fast_response.py CHANGED Viewed

@@ -1,4 +1,5 @@
 from rapidata.rapidata_client.settings._rapidata_setting import RapidataSetting
+from rapidata.rapidata_client.logging import managed_print
 class AlertOnFastResponse(RapidataSetting):
     """
@@ -12,7 +13,7 @@ class AlertOnFastResponse(RapidataSetting):
         if not isinstance(threshold, int):
             raise ValueError("The alert must be an integer.")
         if threshold < 10:
-            print(f"Warning: Are you sure you want to set the threshold so low ({threshold} milliseconds)?")
+            managed_print(f"Warning: Are you sure you want to set the threshold so low ({threshold} milliseconds)?")
         if threshold > 25000:
             raise ValueError("The alert must be less than 25000 milliseconds.")
         if threshold < 0:

rapidata/rapidata_client/settings/free_text_minimum_characters.py CHANGED Viewed

@@ -1,4 +1,5 @@
 from rapidata.rapidata_client.settings._rapidata_setting import RapidataSetting
+from rapidata.rapidata_client.logging import managed_print, logger
 class FreeTextMinimumCharacters(RapidataSetting):
     """
@@ -12,5 +13,5 @@ class FreeTextMinimumCharacters(RapidataSetting):
         if value < 1:
             raise ValueError("The minimum number of characters must be greater than or equal to 1.")
         if value > 40:
-            print(f"Warning: Are you sure you want to set the minimum number of characters at {value}?")
+            managed_print(f"Warning: Are you sure you want to set the minimum number of characters at {value}?")
         super().__init__(key="free_text_minimum_characters", value=value)

rapidata/rapidata_client/validation/rapidata_validation_set.py CHANGED Viewed

@@ -1,7 +1,6 @@
 from rapidata.rapidata_client.validation.rapids.rapids import Rapid
 from rapidata.service.openapi_service import OpenAPIService
-from requests.adapters import HTTPAdapter, Retry
-import requests
+from rapidata.rapidata_client.logging import logger
 from rapidata.api_client.models.update_dimensions_model import UpdateDimensionsModel
 from rapidata.rapidata_client.assets._sessions import SessionManager
@@ -37,6 +36,7 @@ class RapidataValidationSet:
         Args:
             dimensions (list[str]): The new dimensions of the validation set.
         """
+        logger.debug(f"Updating dimensions for validation set {self.id} to {dimensions}")
         self.__openapi_service.validation_api.validation_validation_set_id_dimensions_patch(self.id, UpdateDimensionsModel(dimensions=dimensions))
         return self

rapidata/rapidata_client/validation/rapids/rapids.py CHANGED Viewed

@@ -19,7 +19,8 @@ from rapidata.api_client.models.create_datapoint_from_files_model_metadata_inner
 from rapidata.service.openapi_service import OpenAPIService
-import requests
+from rapidata.rapidata_client.logging import logger
 class Rapid():
     def __init__(self, asset: MediaAsset | TextAsset | MultiAsset, metadata: Sequence[Metadata], payload: Any, truth: Any, randomCorrectProbability: float, explanation: str | None):
@@ -29,6 +30,7 @@ class Rapid():
         self.truth = truth
         self.randomCorrectProbability = randomCorrectProbability
         self.explanation = explanation
+        logger.debug(f"Created Rapid with asset: {self.asset}, metadata: {self.metadata}, payload: {self.payload}, truth: {self.truth}, randomCorrectProbability: {self.randomCorrectProbability}, explanation: {self.explanation}")
     def _add_to_validation_set(self, validationSetId: str, openapi_service: OpenAPIService) -> None:
         if isinstance(self.asset, TextAsset) or (isinstance(self.asset, MultiAsset) and isinstance(self.asset.assets[0], TextAsset)):

rapidata 2.21.5__py3-none-any.whl → 2.23.0__py3-none-any.whl

Potentially problematic release.

rapidata 2.21.5__py3-none-any.whl → 2.23.0__py3-none-any.whl