PyPI - scale-nucleus - Versions diffs - 0.1.22__py3-none-any.whl → 0.6.4__py3-none-any.whl - Mend

scale-nucleus 0.1.22__py3-none-any.whl → 0.6.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (73)

cli/client.py +14 -0
cli/datasets.py +77 -0
cli/helpers/__init__.py +0 -0
cli/helpers/nucleus_url.py +10 -0
cli/helpers/web_helper.py +40 -0
cli/install_completion.py +33 -0
cli/jobs.py +42 -0
cli/models.py +35 -0
cli/nu.py +42 -0
cli/reference.py +8 -0
cli/slices.py +62 -0
cli/tests.py +121 -0
nucleus/__init__.py +453 -699
nucleus/annotation.py +435 -80
nucleus/autocurate.py +9 -0
nucleus/connection.py +87 -0
nucleus/constants.py +12 -2
nucleus/data_transfer_object/__init__.py +0 -0
nucleus/data_transfer_object/dataset_details.py +9 -0
nucleus/data_transfer_object/dataset_info.py +26 -0
nucleus/data_transfer_object/dataset_size.py +5 -0
nucleus/data_transfer_object/scenes_list.py +18 -0
nucleus/dataset.py +1139 -215
nucleus/dataset_item.py +130 -26
nucleus/dataset_item_uploader.py +297 -0
nucleus/deprecation_warning.py +32 -0
nucleus/errors.py +21 -1
nucleus/job.py +71 -3
nucleus/logger.py +9 -0
nucleus/metadata_manager.py +45 -0
nucleus/metrics/__init__.py +10 -0
nucleus/metrics/base.py +117 -0
nucleus/metrics/categorization_metrics.py +197 -0
nucleus/metrics/errors.py +7 -0
nucleus/metrics/filters.py +40 -0
nucleus/metrics/geometry.py +198 -0
nucleus/metrics/metric_utils.py +28 -0
nucleus/metrics/polygon_metrics.py +480 -0
nucleus/metrics/polygon_utils.py +299 -0
nucleus/model.py +121 -15
nucleus/model_run.py +34 -57
nucleus/payload_constructor.py +30 -18
nucleus/prediction.py +259 -17
nucleus/pydantic_base.py +26 -0
nucleus/retry_strategy.py +4 -0
nucleus/scene.py +204 -19
nucleus/slice.py +230 -67
nucleus/upload_response.py +20 -9
nucleus/url_utils.py +4 -0
nucleus/utils.py +139 -35
nucleus/validate/__init__.py +24 -0
nucleus/validate/client.py +168 -0
nucleus/validate/constants.py +20 -0
nucleus/validate/data_transfer_objects/__init__.py +0 -0
nucleus/validate/data_transfer_objects/eval_function.py +81 -0
nucleus/validate/data_transfer_objects/scenario_test.py +19 -0
nucleus/validate/data_transfer_objects/scenario_test_evaluations.py +11 -0
nucleus/validate/data_transfer_objects/scenario_test_metric.py +12 -0
nucleus/validate/errors.py +6 -0
nucleus/validate/eval_functions/__init__.py +0 -0
nucleus/validate/eval_functions/available_eval_functions.py +212 -0
nucleus/validate/eval_functions/base_eval_function.py +60 -0
nucleus/validate/scenario_test.py +143 -0
nucleus/validate/scenario_test_evaluation.py +114 -0
nucleus/validate/scenario_test_metric.py +14 -0
nucleus/validate/utils.py +8 -0
{scale_nucleus-0.1.22.dist-info → scale_nucleus-0.6.4.dist-info}/LICENSE +0 -0
scale_nucleus-0.6.4.dist-info/METADATA +213 -0
scale_nucleus-0.6.4.dist-info/RECORD +71 -0
{scale_nucleus-0.1.22.dist-info → scale_nucleus-0.6.4.dist-info}/WHEEL +1 -1
scale_nucleus-0.6.4.dist-info/entry_points.txt +3 -0
scale_nucleus-0.1.22.dist-info/METADATA +0 -85
scale_nucleus-0.1.22.dist-info/RECORD +0 -21

nucleus/prediction.py CHANGED Viewed

@@ -1,52 +1,112 @@
-from typing import Dict, Optional, List
+"""
+All of the prediction types supported. In general, prediction types are the same
+as annotation types, but come with additional, optional data that can be attached
+such as confidence or probability distributions.
+"""
+from dataclasses import dataclass, field
+from typing import Dict, List, Optional, Union
 from .annotation import (
     BoxAnnotation,
+    CategoryAnnotation,
+    CuboidAnnotation,
     Point,
+    Point3D,
     PolygonAnnotation,
     Segment,
     SegmentationAnnotation,
-    CuboidAnnotation,
-    Point3D,
 )
 from .constants import (
     ANNOTATION_ID_KEY,
+    ANNOTATIONS_KEY,
     BOX_TYPE,
+    CATEGORY_TYPE,
+    CLASS_PDF_KEY,
+    CONFIDENCE_KEY,
     CUBOID_TYPE,
-    POLYGON_TYPE,
-    REFERENCE_ID_KEY,
-    METADATA_KEY,
+    DIMENSIONS_KEY,
     GEOMETRY_KEY,
+    HEIGHT_KEY,
     LABEL_KEY,
+    MASK_URL_KEY,
+    METADATA_KEY,
+    POLYGON_TYPE,
+    POSITION_KEY,
+    REFERENCE_ID_KEY,
+    TAXONOMY_NAME_KEY,
     TYPE_KEY,
+    VERTICES_KEY,
+    WIDTH_KEY,
     X_KEY,
     Y_KEY,
-    WIDTH_KEY,
-    HEIGHT_KEY,
-    CLASS_PDF_KEY,
-    CONFIDENCE_KEY,
-    VERTICES_KEY,
-    ANNOTATIONS_KEY,
-    MASK_URL_KEY,
-    POSITION_KEY,
-    DIMENSIONS_KEY,
     YAW_KEY,
 )
 def from_json(payload: dict):
+    """Instantiates prediction object from schematized JSON dict payload."""
     if payload.get(TYPE_KEY, None) == BOX_TYPE:
         return BoxPrediction.from_json(payload)
     elif payload.get(TYPE_KEY, None) == POLYGON_TYPE:
         return PolygonPrediction.from_json(payload)
     elif payload.get(TYPE_KEY, None) == CUBOID_TYPE:
         return CuboidPrediction.from_json(payload)
+    elif payload.get(TYPE_KEY, None) == CATEGORY_TYPE:
+        return CategoryPrediction.from_json(payload)
     else:
         return SegmentationPrediction.from_json(payload)
 class SegmentationPrediction(SegmentationAnnotation):
-    # No need to define init or to_payload methods because
-    # we default to functions defined in the parent class
+    """Predicted segmentation mask on a 2D image.
+    ::
+        from nucleus import SegmentationPrediction
+        segmentation = SegmentationPrediction(
+            mask_url="s3://your-bucket-name/pred-seg-masks/image_2_pred_mask_id1.png",
+            annotations=[
+                Segment(label="grass", index="1"),
+                Segment(label="road", index="2"),
+                Segment(label="bus", index="3", metadata={"vehicle_color": "yellow"}),
+                Segment(label="tree", index="4")
+            ],
+            reference_id="image_2",
+            annotation_id="image_2_pred_mask_1",
+        )
+    Parameters:
+        mask_url (str): A URL pointing to the segmentation prediction mask which is
+          accessible to Scale. The mask is an HxW int8 array saved in PNG format,
+          with each pixel value ranging from [0, N), where N is the number of
+          possible classes (for semantic segmentation) or instances (for instance
+          segmentation).
+          The height and width of the mask must be the same as the
+          original image. One example for semantic segmentation: the mask is 0
+          for pixels where there is background, 1 where there is a car, and 2
+          where there is a pedestrian.
+          Another example for instance segmentation: the mask is 0 for one car,
+          1 for another car, 2 for a motorcycle and 3 for another motorcycle.
+          The class name for each value in the mask is stored in the list of
+          Segment objects passed for "annotations"
+        annotations (List[:class:`Segment`]): The list of mappings between the integer values contained
+          in mask_url and string class labels. In the semantic segmentation
+          example above these would map that 0 to background, 1 to car and 2 to
+          pedestrian. In the instance segmentation example above, 0 and 1 would
+          both be mapped to car, 2 and 3 would both be mapped to motorcycle
+        reference_id (str): User-defined ID of the image to which to apply this annotation.
+        annotation_id (Optional[str]): For segmentation predictions, this value is ignored
+          because there can only be one segmentation prediction per dataset item.
+          Therefore regardless of annotation ID, if there is an existing
+          segmentation on a dataset item, it will be ignored unless update=True
+          is passed to :meth:`Dataset.annotate`, in which case it will be overwritten.
+          Storing a custom ID here may be useful in order to tie this annotation
+          to an external database, and its value will be returned for any export.
+    """
     @classmethod
     def from_json(cls, payload: dict):
         return cls(
@@ -61,6 +121,36 @@ class SegmentationPrediction(SegmentationAnnotation):
 class BoxPrediction(BoxAnnotation):
+    """Prediction of a bounding box.
+    Parameters:
+        label (str): The label for this annotation (e.g. car, pedestrian, bicycle)
+        x (Union[float, int]): The distance, in pixels, between the left border
+            of the bounding box and the left border of the image.
+        y (Union[float, int]): The distance, in pixels, between the top border
+            of the bounding box and the top border of the image.
+        width (Union[float, int]): The width in pixels of the annotation.
+        height (Union[float, int]): The height in pixels of the annotation.
+        reference_id (str): User-defined ID of the image to which to apply this
+            annotation.
+        confidence: 0-1 indicating the confidence of the prediction.
+        annotation_id (Optional[str]): The annotation ID that uniquely
+            identifies this annotation within its target dataset item. Upon ingest,
+            a matching annotation id will be ignored by default, and updated if
+            update=True for dataset.annotate.  If no annotation ID is passed, one
+            will be automatically generated using the label, x, y, width, and
+            height, so that you can make inserts idempotently and identical boxes
+            will be ignored.
+        metadata (Optional[Dict]): Arbitrary key/value dictionary of info to
+            attach to this annotation.  Strings, floats and ints are supported best
+            by querying and insights features within Nucleus. For more details see
+            our `metadata guide <https://nucleus.scale.com/docs/upload-metadata>`_.
+        class_pdf: An optional complete class probability distribution on this
+            annotation. Each value should be between 0 and 1 (inclusive), and sum up to
+            1 as a complete distribution. This can be useful for computing entropy to
+            surface places where the model is most uncertain.
+    """
     def __init__(
         self,
         label: str,
@@ -114,6 +204,28 @@ class BoxPrediction(BoxAnnotation):
 class PolygonPrediction(PolygonAnnotation):
+    """Prediction of a polygon.
+    Parameters:
+        label (str): The label for this annotation (e.g. car, pedestrian, bicycle).
+        vertices List[:class:`Point`]: The list of points making up the polygon.
+        reference_id (str): User-defined ID of the image to which to apply this
+            annotation.
+        confidence: 0-1 indicating the confidence of the prediction.
+        annotation_id (Optional[str]): The annotation ID that uniquely identifies
+            this annotation within its target dataset item. Upon ingest, a matching
+            annotation id will be ignored by default, and updated if update=True
+            for dataset.annotate.
+        metadata (Optional[Dict]): Arbitrary key/value dictionary of info to
+            attach to this annotation.  Strings, floats and ints are supported best
+            by querying and insights features within Nucleus. For more details see
+            our `metadata guide <https://nucleus.scale.com/docs/upload-metadata>`_.
+        class_pdf: An optional complete class probability distribution on this
+            annotation. Each value should be between 0 and 1 (inclusive), and sum up to
+            1 as a complete distribution. This can be useful for computing entropy to
+            surface places where the model is most uncertain.
+    """
     def __init__(
         self,
         label: str,
@@ -160,6 +272,29 @@ class PolygonPrediction(PolygonAnnotation):
 class CuboidPrediction(CuboidAnnotation):
+    """A prediction of 3D cuboid.
+    Parameters:
+        label (str): The label for this annotation (e.g. car, pedestrian, bicycle)
+        position (:class:`Point3D`): The point at the center of the cuboid
+        dimensions (:class:`Point3D`): The length (x), width (y), and height (z) of the cuboid
+        yaw (float): The rotation, in radians, about the Z axis of the cuboid
+        reference_id (str): User-defined ID of the image to which to apply this annotation.
+        confidence: 0-1 indicating the confidence of the prediction.
+        annotation_id (Optional[str]): The annotation ID that uniquely identifies this
+          annotation within its target dataset item. Upon ingest, a matching
+          annotation id will be ignored by default, and updated if update=True
+          for dataset.annotate.
+        metadata (Optional[str]): Arbitrary key/value dictionary of info to attach to this
+          annotation.  Strings, floats and ints are supported best by querying
+          and insights features within Nucleus. For more details see our `metadata
+          guide <https://nucleus.scale.com/docs/upload-metadata>`_.
+        class_pdf: An optional complete class probability distribution on this
+            annotation. Each value should be between 0 and 1 (inclusive), and sum up to
+            1 as a complete distribution. This can be useful for computing entropy to
+            surface places where the model is most uncertain.
+    """
     def __init__(
         self,
         label: str,
@@ -207,3 +342,110 @@ class CuboidPrediction(CuboidAnnotation):
             metadata=payload.get(METADATA_KEY, {}),
             class_pdf=payload.get(CLASS_PDF_KEY, None),
         )
+class CategoryPrediction(CategoryAnnotation):
+    """A prediction of a category.
+    Parameters:
+        label: The label for this annotation (e.g. car, pedestrian, bicycle).
+        reference_id: The reference ID of the image you wish to apply this annotation to.
+        taxonomy_name: The name of the taxonomy this annotation conforms to.
+          See :meth:`Dataset.add_taxonomy`.
+        confidence: 0-1 indicating the confidence of the prediction.
+        class_pdf: An optional complete class probability distribution on this
+            prediction. Each value should be between 0 and 1 (inclusive), and sum up to
+            1 as a complete distribution. This can be useful for computing entropy to
+            surface places where the model is most uncertain.
+        metadata: Arbitrary key/value dictionary of info to attach to this annotation.
+            Strings, floats and ints are supported best by querying and insights
+            features within Nucleus. For more details see our `metadata guide
+            <https://nucleus.scale.com/docs/upload-metadata>`_.
+    """
+    def __init__(
+        self,
+        label: str,
+        reference_id: str,
+        taxonomy_name: Optional[str] = None,
+        confidence: Optional[float] = None,
+        metadata: Optional[Dict] = None,
+        class_pdf: Optional[Dict] = None,
+    ):
+        super().__init__(
+            label=label,
+            taxonomy_name=taxonomy_name,
+            reference_id=reference_id,
+            metadata=metadata,
+        )
+        self.confidence = confidence
+        self.class_pdf = class_pdf
+    def to_payload(self) -> dict:
+        payload = super().to_payload()
+        if self.confidence is not None:
+            payload[CONFIDENCE_KEY] = self.confidence
+        if self.class_pdf is not None:
+            payload[CLASS_PDF_KEY] = self.class_pdf
+        return payload
+    @classmethod
+    def from_json(cls, payload: dict):
+        return cls(
+            label=payload.get(LABEL_KEY, 0),
+            taxonomy_name=payload.get(TAXONOMY_NAME_KEY, None),
+            reference_id=payload[REFERENCE_ID_KEY],
+            confidence=payload.get(CONFIDENCE_KEY, None),
+            metadata=payload.get(METADATA_KEY, {}),
+            class_pdf=payload.get(CLASS_PDF_KEY, None),
+        )
+Prediction = Union[
+    BoxPrediction,
+    PolygonPrediction,
+    CuboidPrediction,
+    CategoryPrediction,
+    SegmentationPrediction,
+]
+@dataclass
+class PredictionList:
+    """Wrapper class separating a list of predictions by type."""
+    box_predictions: List[BoxPrediction] = field(default_factory=list)
+    polygon_predictions: List[PolygonPrediction] = field(default_factory=list)
+    cuboid_predictions: List[CuboidPrediction] = field(default_factory=list)
+    category_predictions: List[CategoryPrediction] = field(
+        default_factory=list
+    )
+    segmentation_predictions: List[SegmentationPrediction] = field(
+        default_factory=list
+    )
+    def add_predictions(self, predictions: List[Prediction]):
+        for prediction in predictions:
+            if isinstance(prediction, BoxPrediction):
+                self.box_predictions.append(prediction)
+            elif isinstance(prediction, PolygonPrediction):
+                self.polygon_predictions.append(prediction)
+            elif isinstance(prediction, CuboidPrediction):
+                self.cuboid_predictions.append(prediction)
+            elif isinstance(prediction, CategoryPrediction):
+                self.category_predictions.append(prediction)
+            else:
+                assert isinstance(
+                    prediction, SegmentationPrediction
+                ), f"Unexpected prediction type: {type(prediction)}"
+                self.segmentation_predictions.append(prediction)
+    def __len__(self):
+        return (
+            len(self.box_predictions)
+            + len(self.polygon_predictions)
+            + len(self.cuboid_predictions)
+            + len(self.category_predictions)
+            + len(self.segmentation_predictions)
+        )

nucleus/pydantic_base.py ADDED Viewed

@@ -0,0 +1,26 @@
+from pydantic import BaseModel  # pylint: disable=no-name-in-module
+class ImmutableModel(BaseModel):
+    class Config:
+        allow_mutation = False
+class DictCompatibleModel(BaseModel):
+    """Backwards compatible wrapper where we transform dictionaries into Pydantic Models
+    Allows us to access model.key with model["key"].
+    """
+    def __getitem__(self, key):
+        return getattr(self, key)
+class DictCompatibleImmutableModel(ImmutableModel):
+    """Backwards compatible wrapper where we transform dictionaries into Pydantic Models
+    Allows us to access model.key with model["key"].
+    """
+    def __getitem__(self, key):
+        return getattr(self, key)

nucleus/retry_strategy.py ADDED Viewed

@@ -0,0 +1,4 @@
+# TODO: use retry library instead of custom code. Tenacity is one option.
+class RetryStrategy:
+    statuses = {503, 524, 520, 504}
+    sleep_times = [1, 3, 9]

scale-nucleus 0.1.22__py3-none-any.whl → 0.6.4__py3-none-any.whl

scale-nucleus 0.1.22__py3-none-any.whl → 0.6.4__py3-none-any.whl