PyPI - rapidata - Versions diffs - 2.8.0__py3-none-any.whl → 2.9.0__py3-none-any.whl - Mend

rapidata 2.8.0__py3-none-any.whl → 2.9.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of rapidata might be problematic. Click here for more details.

Files changed (7) hide show

rapidata/rapidata_client/order/rapidata_order.py CHANGED Viewed

@@ -8,6 +8,7 @@ from typing import Optional, cast, Any
 from rapidata.api_client.models.workflow_artifact_model import WorkflowArtifactModel
 from rapidata.api_client.models.preliminary_download_model import PreliminaryDownloadModel
 from tqdm import tqdm
+from rapidata.rapidata_client.order.rapidata_results import RapidataResults
 class RapidataOrder:
     """
@@ -154,13 +155,13 @@ class RapidataOrder:
         return progress
-    def __get_preliminary_results(self) -> dict[str, Any]:
+    def __get_preliminary_results(self) -> RapidataResults:
         pipeline_id = self.__get_pipeline_id()
         try:
             download_id = self.__openapi_service.pipeline_api.pipeline_pipeline_id_preliminary_download_post(pipeline_id, PreliminaryDownloadModel(sendEmail=False)).download_id
             while not (preliminary_results := self.__openapi_service.pipeline_api.pipeline_preliminary_download_preliminary_download_id_get(preliminary_download_id=download_id)):
                 sleep(1)
-            return json.loads(preliminary_results.decode())
+            return RapidataResults(json.loads(preliminary_results.decode()))
         except ApiException as e:
             # Handle API exceptions
@@ -169,7 +170,7 @@ class RapidataOrder:
             # Handle JSON parsing errors
             raise Exception(f"Failed to parse preliminary order results: {str(e)}") from e
-    def get_results(self, preliminary_results=False) -> dict[str, Any]:
+    def get_results(self, preliminary_results: bool=False) -> RapidataResults:
         """
         Gets the results of the order.
         If the order is still processing, this method will block until the order is completed and then return the results.
@@ -194,7 +195,7 @@ class RapidataOrder:
         try:
             # Get the raw result string
-            return self.__openapi_service.order_api.order_get_order_results_get(id=self.order_id) # type: ignore
+            return RapidataResults(self.__openapi_service.order_api.order_get_order_results_get(id=self.order_id)) # type: ignore
         except ApiException as e:
             # Handle API exceptions

rapidata/rapidata_client/order/rapidata_results.py ADDED Viewed

@@ -0,0 +1,143 @@
+import pandas as pd
+from typing import Any
+from pandas.core.indexes.base import Index
+import json
+class RapidataResults(dict):
+    """
+    A specialized dictionary class for handling Rapidata API results.
+    Extends the built-in dict class with specialized methods.
+    """
+    def to_pandas(self) -> pd.DataFrame:
+        """
+        Converts the results to a pandas DataFrame.
+        For Compare results, creates standardized A/B columns for metrics like:
+        - aggregatedResults
+        - aggregatedResultsRatios
+        - summedUserScores
+        - summedUserScoresRatios
+        For regular results, flattens nested dictionaries into columns with underscore-separated names.
+        Returns:
+            pd.DataFrame: A DataFrame containing the processed results
+        """
+        if "results" not in self or not self["results"]:
+            return pd.DataFrame()
+        if self["info"].get("orderType") == "Compare":
+            return self._compare_to_pandas()
+        if self["info"].get("orderType") is None:
+            print("Warning: Results are old and Order type is not specified. Dataframe might be wrong.")
+        # Get the structure from first item
+        first_item = self["results"][0]
+        columns = []
+        path_map = {}  # Maps flattened column names to paths to reach the values
+        # Build the column structure once
+        self._build_column_structure(first_item, columns, path_map)
+        # Extract data using the known structure
+        data = []
+        for item in self["results"]:
+            row = []
+            for path in path_map.values():
+                value = self._get_value_from_path(item, path)
+                row.append(value)
+            data.append(row)
+        return pd.DataFrame(data, columns=Index(columns))
+    def _build_column_structure(
+        self,
+        d: dict[str, Any],
+        columns: list[str],
+        path_map: dict[str, list[str]],
+        parent_key: str = '',
+        current_path: list[str] | None = None
+    ) -> None:
+        """
+        Builds the column structure and paths to reach values in nested dictionaries.
+        Args:
+            d: The dictionary to analyze
+            columns: List to store column names
+            path_map: Dictionary mapping column names to paths for accessing values
+            parent_key: The parent key for nested dictionaries
+            current_path: The current path in the dictionary structure
+        """
+        if current_path is None:
+            current_path = []
+        for key, value in d.items():
+            new_key = f"{parent_key}_{key}" if parent_key else key
+            new_path: list[str] = current_path + [key]
+            if isinstance(value, dict):
+                self._build_column_structure(value, columns, path_map, new_key, new_path)
+            else:
+                columns.append(new_key)
+                path_map[new_key] = new_path
+    def _get_value_from_path(self, d: dict[str, Any], path: list[str]) -> Any:
+        """
+        Retrieves a value from a nested dictionary using a path list.
+        Args:
+            d: The dictionary to retrieve the value from
+            path: List of keys forming the path to the desired value
+        Returns:
+            The value at the specified path, or None if the path doesn't exist
+        """
+        for key in path[:-1]:
+            d = d.get(key, {})
+        return d.get(path[-1])
+    def _compare_to_pandas(self):
+        """
+        Converts Compare results to a pandas DataFrame dynamically.
+        """
+        if not self.get("results"):
+            return pd.DataFrame()
+        rows = []
+        for result in self["results"]:
+            # Get the image names from the first metric we find
+            for key in result:
+                if isinstance(result[key], dict) and len(result[key]) == 2:
+                    assets = list(result[key].keys())
+                    break
+            else:
+                continue
+            asset_a, asset_b = assets[0], assets[1]
+            # Initialize row with non-comparative fields
+            row = {
+                key: value for key, value in result.items()
+                if not isinstance(value, dict)
+            }
+            # Handle comparative metrics
+            for key, values in result.items():
+                if isinstance(values, dict) and len(values) == 2:
+                    row[f'A_{key}'] = values[asset_a]
+                    row[f'B_{key}'] = values[asset_b]
+            rows.append(row)
+        return pd.DataFrame(rows)
+    def to_json(self, path: str="./results.json"):
+        """
+        Saves the results to a JSON file.
+        Args:
+            path: The file path where the JSON should be saved. Defaults to "./results.json".
+        """
+        with open(path, 'w') as f:
+            json.dump(self, f)

rapidata/rapidata_client/validation/validation_set_manager.py CHANGED Viewed

@@ -47,7 +47,7 @@ class ValidationSetManager:
             instruction (str): The instruction by which the labeler will answer.
             answer_options (list[str]): The options to choose from when answering.
             datapoints (list[str]): The datapoints that will be used for validation.
-            truths (list[list[str]]): The truths for each datapoint. Outher list is for each datapoint, inner list is for each truth.\n
+            truths (list[list[str]]): The truths for each datapoint. Outer list is for each datapoint, inner list is for each truth.\n
                 example:
                     options: ["yes", "no", "maybe"]
                     datapoints: ["datapoint1", "datapoint2"]
@@ -161,7 +161,7 @@ class ValidationSetManager:
         Args:
             name (str): The name of the validation set. (will not be shown to the labeler)
             instruction (str): The instruction to show to the labeler.
-            truths (list[list[int]]): The truths for each datapoint. Outher list is for each datapoint, inner list is for each truth.\n
+            truths (list[list[int]]): The truths for each datapoint. Outer list is for each datapoint, inner list is for each truth.\n
                 example:
                     datapoints: ["datapoint1", "datapoint2"]
                     sentences: ["this example 1", "this example 2"]
@@ -214,7 +214,7 @@ class ValidationSetManager:
         Args:
             name (str): The name of the validation set. (will not be shown to the labeler)
             instruction (str): The instruction to show to the labeler.
-            truths (list[list[Box]]): The truths for each datapoint. Outher list is for each datapoint, inner list is for each truth.\n
+            truths (list[list[Box]]): The truths for each datapoint. Outer list is for each datapoint, inner list is for each truth.\n
                 example:
                     datapoints: ["datapoint1", "datapoint2"]
                     truths: [[Box(0, 0, 100, 100)], [Box(50, 50, 150, 150)]] -> first datapoint the object is in the top left corner, second datapoint the object is in the center
@@ -266,7 +266,7 @@ class ValidationSetManager:
         Args:
             name (str): The name of the validation set. (will not be shown to the labeler)
             instruction (str): The instruction to show to the labeler.
-            truths (list[list[Box]]): The truths for each datapoint. Outher list is for each datapoint, inner list is for each truth.\n
+            truths (list[list[Box]]): The truths for each datapoint. Outer list is for each datapoint, inner list is for each truth.\n
                 example:
                     datapoints: ["datapoint1", "datapoint2"]
                     truths: [[Box(0, 0, 100, 100)], [Box(50, 50, 150, 150)]] -> first datapoint the object is in the top left corner, second datapoint the object is in the center
@@ -318,7 +318,7 @@ class ValidationSetManager:
             name (str): The name of the validation set. (will not be shown to the labeler)
             instruction (str): The instruction to show to the labeler.
             truths (list[list[tuple[int, int]]]): The truths for each datapoint defined as start and endpoint based on milliseconds.
-            Outher list is for each datapoint, inner list is for each truth.\n
+                Outer list is for each datapoint, inner list is for each truth.\n
                 example:
                     datapoints: ["datapoint1", "datapoint2"]
                     truths: [[(0, 10)], [(20, 30)]] -> first datapoint the correct interval is from 0 to 10, second datapoint the correct interval is from 20 to 30
@@ -396,9 +396,6 @@ class ValidationSetManager:
         if validation_set_id is None:
             raise ValueError("Failed to create validation set")
-        if print_confirmation:
-            print(f"Validation set '{name}' created with ID {validation_set_id}")
         validation_set = RapidataValidationSet(
             name=name,
             validation_set_id=validation_set_id,
@@ -408,6 +405,12 @@ class ValidationSetManager:
         for rapid in tqdm(rapids, desc="Uploading validation tasks"):
             validation_set.add_rapid(rapid)
+        if print_confirmation:
+            print()
+            print(f"Validation set '{name}' created with ID {validation_set_id}\n",
+                  f"Now viewable under: https://app.{self.__openapi_service.enviroment}/validation-set/detail/{validation_set_id}",
+                  sep="")
         return validation_set

{rapidata-2.8.0.dist-info → rapidata-2.9.0.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.3
 Name: rapidata
-Version: 2.8.0
+Version: 2.9.0
 Summary: Rapidata package containing the Rapidata Python Client to interact with the Rapidata Web API in an easy way.
 License: Apache-2.0
 Author: Rapidata AG
@@ -14,6 +14,7 @@ Classifier: Programming Language :: Python :: 3.12
 Classifier: Programming Language :: Python :: 3.13
 Requires-Dist: colorama (==0.4.6)
 Requires-Dist: deprecated (>=1.2.14,<2.0.0)
+Requires-Dist: pandas (>=2.2.3,<3.0.0)
 Requires-Dist: pillow (>=10.4.0,<11.0.0)
 Requires-Dist: pydantic (>=2.8.2,<3.0.0)
 Requires-Dist: pyjwt (>=2.9.0,<3.0.0)

{rapidata-2.8.0.dist-info → rapidata-2.9.0.dist-info}/RECORD RENAMED Viewed

@@ -397,8 +397,9 @@ rapidata/rapidata_client/metadata/_select_words_metadata.py,sha256=I4qVtCkj60ljk
 rapidata/rapidata_client/order/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 rapidata/rapidata_client/order/_rapidata_dataset.py,sha256=ipSLGEQm6Z5Gj0Z13SmE5-uUwqUeEtC7SyGWx_7piuo,5439
 rapidata/rapidata_client/order/_rapidata_order_builder.py,sha256=N6mqmgneJSsb_no_Ps9BG3EhDekLgKxFYpjDCN-VVeg,13095
-rapidata/rapidata_client/order/rapidata_order.py,sha256=vlKsnYJBZWKZQQmH4zNcPQ_bsPP5bycwJ52FHaxlwSg,8997
+rapidata/rapidata_client/order/rapidata_order.py,sha256=XI9xeEtqZIwdAXLe9Pn4RO8iPNSoBToQ2WD62TRWzTE,9115
 rapidata/rapidata_client/order/rapidata_order_manager.py,sha256=4wW5xtmEtdewFGGwMWSMbdLZpHvygtLCfYNv4lcHGg8,27271
+rapidata/rapidata_client/order/rapidata_results.py,sha256=tCQgfv70FHJBcVsgAjqkYZB8ZvqrPGD_hlOmzArlLHg,5037
 rapidata/rapidata_client/rapidata_client.py,sha256=A9mnSX6wzVF9TxS1YH87hTi4jCn75dIuP3KZj5Y_vFg,1957
 rapidata/rapidata_client/referee/__init__.py,sha256=q0Hv9nmfEpyChejtyMLT8hWKL0vTTf_UgUXPYNJ-H6M,153
 rapidata/rapidata_client/referee/_base_referee.py,sha256=MdFOhdxt3sRnWXLDKLJZKFdVpjBGn9jypPnWWQ6msQA,496
@@ -430,7 +431,7 @@ rapidata/rapidata_client/validation/rapids/__init__.py,sha256=WU5PPwtTJlte6U90MD
 rapidata/rapidata_client/validation/rapids/box.py,sha256=t3_Kn6doKXdnJdtbwefXnYKPiTKHneJl9E2inkDSqL8,589
 rapidata/rapidata_client/validation/rapids/rapids.py,sha256=aWkcjWR6Pr2BFwz8a0MfqEkXnEJPkAbKMeQtGXnsags,4440
 rapidata/rapidata_client/validation/rapids/rapids_manager.py,sha256=4HOX6c42sCOfpGR2aDoiMgrfjontM8z2KEJwQp4ir6A,14247
-rapidata/rapidata_client/validation/validation_set_manager.py,sha256=X3T1L41v-B1s2JpE8szOpQNOj2ns6leA3NvomNn9TS0,22793
+rapidata/rapidata_client/validation/validation_set_manager.py,sha256=dv9a-Ms4bKOkcfyZfAb-RBjZ6cWT6imM_l3DDvg9aXU,22984
 rapidata/rapidata_client/workflow/__init__.py,sha256=eFRx0fm280alXpds6hYcnxN_yERlabF9B5sTdPFsL1g,430
 rapidata/rapidata_client/workflow/_base_workflow.py,sha256=XyIZFKS_RxAuwIHS848S3AyLEHqd07oTD_5jm2oUbsw,762
 rapidata/rapidata_client/workflow/_classify_workflow.py,sha256=9bT54wxVJgxC-zLk6MVNbseFpzYrvFPjt7DHvxqYfnk,1736
@@ -446,7 +447,7 @@ rapidata/service/credential_manager.py,sha256=Of0BQs_V1T7rkrWX9groLX790nOknaARwn
 rapidata/service/local_file_service.py,sha256=pgorvlWcx52Uh3cEG6VrdMK_t__7dacQ_5AnfY14BW8,877
 rapidata/service/openapi_service.py,sha256=Z4NrAuilLlIWBdGOv6otz36tHS_vvU36w5jmvOUTmqo,3198
 rapidata/service/token_manager.py,sha256=JZ5YbR5Di8dO3H4kK11d0kzWlrXxjgCmeNkHA4AapCM,6425
-rapidata-2.8.0.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
-rapidata-2.8.0.dist-info/METADATA,sha256=-OjSpzm7nH9aw1Lf8Kvbc8SpkHcItLygHaJfnRdpN58,1107
-rapidata-2.8.0.dist-info/WHEEL,sha256=IYZQI976HJqqOpQU6PHkJ8fb3tMNBFjg-Cn-pwAbaFM,88
-rapidata-2.8.0.dist-info/RECORD,,
+rapidata-2.9.0.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
+rapidata-2.9.0.dist-info/METADATA,sha256=7GbcyE9ZroILh90eiE2K7HuX_33Xoon2mZP8pRTjL_E,1146
+rapidata-2.9.0.dist-info/WHEEL,sha256=XbeZDeTWKc1w7CSIyre5aMDU_-PohRwTQceYnisIYYY,88
+rapidata-2.9.0.dist-info/RECORD,,

{rapidata-2.8.0.dist-info → rapidata-2.9.0.dist-info}/WHEEL RENAMED Viewed

@@ -1,4 +1,4 @@
 Wheel-Version: 1.0
-Generator: poetry-core 2.0.1
+Generator: poetry-core 2.1.1
 Root-Is-Purelib: true
 Tag: py3-none-any

{rapidata-2.8.0.dist-info → rapidata-2.9.0.dist-info}/LICENSE RENAMED Viewed

File without changes

rapidata 2.8.0__py3-none-any.whl → 2.9.0__py3-none-any.whl

Potentially problematic release.

rapidata 2.8.0__py3-none-any.whl → 2.9.0__py3-none-any.whl