valor-lite 0.36.5__py3-none-any.whl → 0.37.5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (38)
  1. valor_lite/cache/__init__.py +11 -0
  2. valor_lite/cache/compute.py +211 -0
  3. valor_lite/cache/ephemeral.py +302 -0
  4. valor_lite/cache/persistent.py +536 -0
  5. valor_lite/classification/__init__.py +5 -10
  6. valor_lite/classification/annotation.py +4 -0
  7. valor_lite/classification/computation.py +233 -251
  8. valor_lite/classification/evaluator.py +882 -0
  9. valor_lite/classification/loader.py +97 -0
  10. valor_lite/classification/metric.py +141 -4
  11. valor_lite/classification/shared.py +184 -0
  12. valor_lite/classification/utilities.py +221 -118
  13. valor_lite/exceptions.py +5 -0
  14. valor_lite/object_detection/__init__.py +5 -4
  15. valor_lite/object_detection/annotation.py +13 -1
  16. valor_lite/object_detection/computation.py +367 -304
  17. valor_lite/object_detection/evaluator.py +804 -0
  18. valor_lite/object_detection/loader.py +292 -0
  19. valor_lite/object_detection/metric.py +152 -3
  20. valor_lite/object_detection/shared.py +206 -0
  21. valor_lite/object_detection/utilities.py +182 -109
  22. valor_lite/semantic_segmentation/__init__.py +5 -4
  23. valor_lite/semantic_segmentation/annotation.py +7 -0
  24. valor_lite/semantic_segmentation/computation.py +20 -110
  25. valor_lite/semantic_segmentation/evaluator.py +414 -0
  26. valor_lite/semantic_segmentation/loader.py +205 -0
  27. valor_lite/semantic_segmentation/shared.py +149 -0
  28. valor_lite/semantic_segmentation/utilities.py +6 -23
  29. {valor_lite-0.36.5.dist-info → valor_lite-0.37.5.dist-info}/METADATA +3 -1
  30. valor_lite-0.37.5.dist-info/RECORD +49 -0
  31. {valor_lite-0.36.5.dist-info → valor_lite-0.37.5.dist-info}/WHEEL +1 -1
  32. valor_lite/classification/manager.py +0 -545
  33. valor_lite/object_detection/manager.py +0 -865
  34. valor_lite/profiling.py +0 -374
  35. valor_lite/semantic_segmentation/benchmark.py +0 -237
  36. valor_lite/semantic_segmentation/manager.py +0 -446
  37. valor_lite-0.36.5.dist-info/RECORD +0 -41
  38. {valor_lite-0.36.5.dist-info → valor_lite-0.37.5.dist-info}/top_level.txt +0 -0
valor_lite/object_detection/utilities.py

@@ -1,43 +1,24 @@
  from collections import defaultdict

  import numpy as np
+ import pyarrow as pa
  from numpy.typing import NDArray

- from valor_lite.object_detection.computation import PairClassification
  from valor_lite.object_detection.metric import Metric, MetricType


  def unpack_precision_recall_into_metric_lists(
-     results: tuple[
-         tuple[
-             NDArray[np.float64],
-             NDArray[np.float64],
-         ],
-         tuple[
-             NDArray[np.float64],
-             NDArray[np.float64],
-         ],
-         NDArray[np.float64],
-         NDArray[np.float64],
-     ],
+     counts: NDArray[np.uint64],
+     precision_recall_f1: NDArray[np.float64],
+     average_precision: NDArray[np.float64],
+     mean_average_precision: NDArray[np.float64],
+     average_recall: NDArray[np.float64],
+     mean_average_recall: NDArray[np.float64],
+     pr_curve: NDArray[np.float64],
      iou_thresholds: list[float],
      score_thresholds: list[float],
-     index_to_label: list[str],
-     label_metadata: NDArray[np.int32],
+     index_to_label: dict[int, str],
  ):
-     (
-         (
-             average_precision,
-             mean_average_precision,
-         ),
-         (
-             average_recall,
-             mean_average_recall,
-         ),
-         precision_recall,
-         pr_curves,
-     ) = results
-
      metrics = defaultdict(list)

      metrics[MetricType.AP] = [
@@ -47,8 +28,7 @@ def unpack_precision_recall_into_metric_lists(
              label=label,
          )
          for iou_idx, iou_threshold in enumerate(iou_thresholds)
-         for label_idx, label in enumerate(index_to_label)
-         if int(label_metadata[label_idx, 0]) > 0
+         for label_idx, label in index_to_label.items()
      ]

      metrics[MetricType.mAP] = [
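
The same change repeats throughout the hunks above and below: in 0.36 the labels arrived as a dense list and were gated by per-label ground-truth counts in label_metadata, while in 0.37 they arrive as a sparse {index: label} mapping, so absent labels are simply never iterated. A minimal sketch of the two iteration styles (the labels, counts, and column layout here are made up for illustration):

    import numpy as np

    # 0.36-style: dense label list plus per-label counts (column 0 = ground-truth count).
    index_to_label_old = ["person", "car", "bicycle"]
    label_metadata = np.array([[5, 7], [0, 2], [3, 3]], dtype=np.int32)
    kept_old = [
        (label_idx, label)
        for label_idx, label in enumerate(index_to_label_old)
        if int(label_metadata[label_idx, 0]) > 0
    ]

    # 0.37-style: labels with no ground truths are simply absent from the mapping.
    index_to_label = {0: "person", 2: "bicycle"}
    kept_new = list(index_to_label.items())

    assert kept_old == kept_new  # [(0, "person"), (2, "bicycle")]
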
@@ -66,8 +46,7 @@ def unpack_precision_recall_into_metric_lists(
              iou_thresholds=iou_thresholds,
              label=label,
          )
-         for label_idx, label in enumerate(index_to_label)
-         if int(label_metadata[label_idx, 0]) > 0
+         for label_idx, label in index_to_label.items()
      ]

      # TODO - (c.zaloom) will be removed in the future
@@ -86,8 +65,7 @@ def unpack_precision_recall_into_metric_lists(
              label=label,
          )
          for score_idx, score_threshold in enumerate(score_thresholds)
-         for label_idx, label in enumerate(index_to_label)
-         if int(label_metadata[label_idx, 0]) > 0
+         for label_idx, label in index_to_label.items()
      ]

      metrics[MetricType.mAR] = [
@@ -107,8 +85,7 @@ def unpack_precision_recall_into_metric_lists(
              iou_thresholds=iou_thresholds,
              label=label,
          )
-         for label_idx, label in enumerate(index_to_label)
-         if int(label_metadata[label_idx, 0]) > 0
+         for label_idx, label in index_to_label.items()
      ]

      # TODO - (c.zaloom) will be removed in the future
@@ -122,24 +99,20 @@ def unpack_precision_recall_into_metric_lists(

      metrics[MetricType.PrecisionRecallCurve] = [
          Metric.precision_recall_curve(
-             precisions=pr_curves[iou_idx, label_idx, :, 0].tolist(), # type: ignore[reportArgumentType]
-             scores=pr_curves[iou_idx, label_idx, :, 1].tolist(), # type: ignore[reportArgumentType]
+             precisions=pr_curve[iou_idx, label_idx, :, 0].tolist(),
+             scores=pr_curve[iou_idx, label_idx, :, 1].tolist(),
              iou_threshold=iou_threshold,
              label=label,
          )
          for iou_idx, iou_threshold in enumerate(iou_thresholds)
-         for label_idx, label in enumerate(index_to_label)
-         if label_metadata[label_idx, 0] > 0
+         for label_idx, label in index_to_label.items()
      ]

-     for label_idx, label in enumerate(index_to_label):
-         if label_metadata[label_idx, 0] == 0:
-             continue
-
+     for label_idx, label in index_to_label.items():
          for score_idx, score_threshold in enumerate(score_thresholds):
              for iou_idx, iou_threshold in enumerate(iou_thresholds):

-                 row = precision_recall[iou_idx, score_idx, label_idx, :]
+                 row = counts[iou_idx, score_idx, :, label_idx]
                  kwargs = {
                      "label": label,
                      "iou_threshold": iou_threshold,
@@ -154,21 +127,22 @@ def unpack_precision_recall_into_metric_lists(
                      )
                  )

+                 row = precision_recall_f1[iou_idx, score_idx, :, label_idx]
                  metrics[MetricType.Precision].append(
                      Metric.precision(
-                         value=float(row[3]),
+                         value=float(row[0]),
                          **kwargs,
                      )
                  )
                  metrics[MetricType.Recall].append(
                      Metric.recall(
-                         value=float(row[4]),
+                         value=float(row[1]),
                          **kwargs,
                      )
                  )
                  metrics[MetricType.F1].append(
                      Metric.f1_score(
-                         value=float(row[5]),
+                         value=float(row[2]),
                          **kwargs,
                      )
                  )
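
The row indexing above implies a layout where the metric axis comes before the label axis. A small sketch of the shapes this unpacking appears to assume (inferred from the slicing, not taken from package documentation):

    import numpy as np

    # precision_recall_f1[iou_idx, score_idx, metric_idx, label_idx]
    # with metric_idx 0 = precision, 1 = recall, 2 = F1, per the float(row[i]) calls above.
    n_ious, n_scores, n_labels = 2, 3, 4
    precision_recall_f1 = np.zeros((n_ious, n_scores, 3, n_labels), dtype=np.float64)

    row = precision_recall_f1[0, 0, :, 1]
    precision, recall, f1 = float(row[0]), float(row[1]), float(row[2])
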
@@ -176,40 +150,153 @@ def unpack_precision_recall_into_metric_lists(
      return metrics


- def _create_empty_confusion_matrix(index_to_labels: list[str]):
-     unmatched_ground_truths = dict()
+ def unpack_confusion_matrix(
+     confusion_matrices: NDArray[np.uint64],
+     unmatched_groundtruths: NDArray[np.uint64],
+     unmatched_predictions: NDArray[np.uint64],
+     index_to_label: dict[int, str],
+     iou_thresholds: list[float],
+     score_thresholds: list[float],
+ ) -> list[Metric]:
+     metrics = []
+     for iou_idx, iou_thresh in enumerate(iou_thresholds):
+         for score_idx, score_thresh in enumerate(score_thresholds):
+             cm_dict = {}
+             ugt_dict = {}
+             upd_dict = {}
+             for idx, label in index_to_label.items():
+                 ugt_dict[label] = int(
+                     unmatched_groundtruths[iou_idx, score_idx, idx]
+                 )
+                 upd_dict[label] = int(
+                     unmatched_predictions[iou_idx, score_idx, idx]
+                 )
+                 for pidx, plabel in index_to_label.items():
+                     if label not in cm_dict:
+                         cm_dict[label] = {}
+                     cm_dict[label][plabel] = int(
+                         confusion_matrices[iou_idx, score_idx, idx, pidx]
+                     )
+             metrics.append(
+                 Metric.confusion_matrix(
+                     confusion_matrix=cm_dict,
+                     unmatched_ground_truths=ugt_dict,
+                     unmatched_predictions=upd_dict,
+                     iou_threshold=iou_thresh,
+                     score_threshold=score_thresh,
+                 )
+             )
+     return metrics
+
+
+ def create_mapping(
+     tbl: pa.Table,
+     pairs: NDArray[np.float64],
+     index: int,
+     id_col: str,
+     uid_col: str,
+ ) -> dict[int, str]:
+     col = pairs[:, index].astype(np.int64)
+     values, indices = np.unique(col, return_index=True)
+     indices = indices[values >= 0]
+     return {
+         tbl[id_col][idx].as_py(): tbl[uid_col][idx].as_py() for idx in indices
+     }
+
+
+ def unpack_examples(
+     detailed_pairs: NDArray[np.float64],
+     mask_tp: NDArray[np.bool_],
+     mask_fn: NDArray[np.bool_],
+     mask_fp: NDArray[np.bool_],
+     iou_thresholds: list[float],
+     score_thresholds: list[float],
+     index_to_datum_id: dict[int, str],
+     index_to_groundtruth_id: dict[int, str],
+     index_to_prediction_id: dict[int, str],
+ ) -> list[Metric]:
+     metrics = []
+     ids = detailed_pairs[:, :5].astype(np.int64)
+     unique_datums = np.unique(detailed_pairs[:, 0].astype(np.int64))
+     for datum_index in unique_datums:
+         mask_datum = detailed_pairs[:, 0] == datum_index
+         mask_datum_tp = mask_tp & mask_datum
+         mask_datum_fp = mask_fp & mask_datum
+         mask_datum_fn = mask_fn & mask_datum
+
+         datum_id = index_to_datum_id[datum_index]
+         for iou_idx, iou_thresh in enumerate(iou_thresholds):
+             for score_idx, score_thresh in enumerate(score_thresholds):
+
+                 unique_tp = np.unique(
+                     ids[np.ix_(mask_datum_tp[iou_idx, score_idx], (0, 1, 2, 3, 4))], axis=0 # type: ignore - numpy ix_ typing
+                 )
+                 unique_fp = np.unique(
+                     ids[np.ix_(mask_datum_fp[iou_idx, score_idx], (0, 2, 4))], axis=0 # type: ignore - numpy ix_ typing
+                 )
+                 unique_fn = np.unique(
+                     ids[np.ix_(mask_datum_fn[iou_idx, score_idx], (0, 1, 3))], axis=0 # type: ignore - numpy ix_ typing
+                 )
+
+                 tp = [
+                     (
+                         index_to_groundtruth_id[row[1]],
+                         index_to_prediction_id[row[2]],
+                     )
+                     for row in unique_tp
+                 ]
+                 fp = [index_to_prediction_id[row[1]] for row in unique_fp]
+                 fn = [index_to_groundtruth_id[row[1]] for row in unique_fn]
+                 metrics.append(
+                     Metric.examples(
+                         datum_id=datum_id,
+                         true_positives=tp,
+                         false_negatives=fn,
+                         false_positives=fp,
+                         iou_threshold=iou_thresh,
+                         score_threshold=score_thresh,
+                     )
+                 )
+     return metrics
+
+
+ def create_empty_confusion_matrix_with_examples(
+     iou_threhsold: float,
+     score_threshold: float,
+     index_to_label: dict[int, str],
+ ) -> Metric:
+     unmatched_groundtruths = dict()
      unmatched_predictions = dict()
      confusion_matrix = dict()
-     for label in index_to_labels:
-         unmatched_ground_truths[label] = {"count": 0, "examples": []}
+     for label in index_to_label.values():
+         unmatched_groundtruths[label] = {"count": 0, "examples": []}
          unmatched_predictions[label] = {"count": 0, "examples": []}
          confusion_matrix[label] = {}
-         for plabel in index_to_labels:
+         for plabel in index_to_label.values():
              confusion_matrix[label][plabel] = {"count": 0, "examples": []}
-     return (
-         confusion_matrix,
-         unmatched_predictions,
-         unmatched_ground_truths,
+
+     return Metric.confusion_matrix_with_examples(
+         confusion_matrix=confusion_matrix,
+         unmatched_ground_truths=unmatched_groundtruths,
+         unmatched_predictions=unmatched_predictions,
+         iou_threshold=iou_threhsold,
+         score_threshold=score_threshold,
      )


- def _unpack_confusion_matrix(
+ def _unpack_confusion_matrix_with_examples(
+     metric: Metric,
      ids: NDArray[np.int32],
      mask_matched: NDArray[np.bool_],
      mask_fp_unmatched: NDArray[np.bool_],
      mask_fn_unmatched: NDArray[np.bool_],
-     index_to_datum_id: list[str],
-     index_to_groundtruth_id: list[str],
-     index_to_prediction_id: list[str],
-     index_to_label: list[str],
-     iou_threhsold: float,
-     score_threshold: float,
+     index_to_datum_id: dict[int, str],
+     index_to_groundtruth_id: dict[int, str],
+     index_to_prediction_id: dict[int, str],
+     index_to_label: dict[int, str],
  ):
-     (
-         confusion_matrix,
-         unmatched_predictions,
-         unmatched_ground_truths,
-     ) = _create_empty_confusion_matrix(index_to_label)
+     if not isinstance(metric.value, dict):
+         raise TypeError("expected metric to contain a dictionary value")

      unique_matches = np.unique(
          ids[np.ix_(mask_matched, (0, 1, 2, 3, 4))], axis=0 # type: ignore - numpy ix_ typing
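
create_mapping above builds an {id: uid} dictionary from an Arrow table that is row-aligned with the pairs array. A standalone sketch of the same steps, with a made-up table and column names:

    import numpy as np
    import pyarrow as pa

    # Row i of the table describes the same pair as row i of `pairs`.
    tbl = pa.table(
        {
            "datum_id": [0, 2, 5, 0],
            "datum_uid": ["img-a", "img-c", "img-f", "img-a"],
        }
    )
    pairs = np.array(
        [
            [0.0, 0.9],
            [2.0, 0.4],
            [5.0, 0.7],
            [0.0, 0.1],
        ]
    )

    col = pairs[:, 0].astype(np.int64)                   # the indexed column
    values, indices = np.unique(col, return_index=True)  # first occurrence of each id
    indices = indices[values >= 0]                       # negative ids mean "no entry"
    mapping = {
        tbl["datum_id"][idx].as_py(): tbl["datum_uid"][idx].as_py() for idx in indices
    }
    assert mapping == {0: "img-a", 2: "img-c", 5: "img-f"}
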
@@ -229,8 +316,8 @@ def _unpack_confusion_matrix(
      for idx in range(n_max):
          if idx < n_unmatched_groundtruths:
              label = index_to_label[unique_unmatched_groundtruths[idx, 2]]
-             unmatched_ground_truths[label]["count"] += 1
-             unmatched_ground_truths[label]["examples"].append(
+             metric.value["unmatched_ground_truths"][label]["count"] += 1
+             metric.value["unmatched_ground_truths"][label]["examples"].append(
                  {
                      "datum_id": index_to_datum_id[
                          unique_unmatched_groundtruths[idx, 0]
@@ -241,9 +328,10 @@ def _unpack_confusion_matrix(
                  }
              )
          if idx < n_unmatched_predictions:
-             label = index_to_label[unique_unmatched_predictions[idx, 2]]
-             unmatched_predictions[label]["count"] += 1
-             unmatched_predictions[label]["examples"].append(
+             label_id = unique_unmatched_predictions[idx, 2]
+             label = index_to_label[label_id]
+             metric.value["unmatched_predictions"][label]["count"] += 1
+             metric.value["unmatched_predictions"][label]["examples"].append(
                  {
                      "datum_id": index_to_datum_id[
                          unique_unmatched_predictions[idx, 0]
@@ -256,8 +344,10 @@ def _unpack_confusion_matrix(
          if idx < n_matched:
              glabel = index_to_label[unique_matches[idx, 3]]
              plabel = index_to_label[unique_matches[idx, 4]]
-             confusion_matrix[glabel][plabel]["count"] += 1
-             confusion_matrix[glabel][plabel]["examples"].append(
+             metric.value["confusion_matrix"][glabel][plabel]["count"] += 1
+             metric.value["confusion_matrix"][glabel][plabel][
+                 "examples"
+             ].append(
                  {
                      "datum_id": index_to_datum_id[unique_matches[idx, 0]],
                      "ground_truth_id": index_to_groundtruth_id[
@@ -269,43 +359,29 @@ def _unpack_confusion_matrix(
                  }
              )

-     return Metric.confusion_matrix(
-         confusion_matrix=confusion_matrix,
-         unmatched_ground_truths=unmatched_ground_truths,
-         unmatched_predictions=unmatched_predictions,
-         iou_threshold=iou_threhsold,
-         score_threshold=score_threshold,
-     )
+     return metric


- def unpack_confusion_matrix_into_metric_list(
-     results: NDArray[np.uint8],
+ def unpack_confusion_matrix_with_examples(
+     metrics: dict[int, dict[int, Metric]],
      detailed_pairs: NDArray[np.float64],
-     iou_thresholds: list[float],
-     score_thresholds: list[float],
-     index_to_datum_id: list[str],
-     index_to_groundtruth_id: list[str],
-     index_to_prediction_id: list[str],
-     index_to_label: list[str],
+     mask_tp: NDArray[np.bool_],
+     mask_fp_fn_misclf: NDArray[np.bool_],
+     mask_fp_unmatched: NDArray[np.bool_],
+     mask_fn_unmatched: NDArray[np.bool_],
+     index_to_datum_id: dict[int, str],
+     index_to_groundtruth_id: dict[int, str],
+     index_to_prediction_id: dict[int, str],
+     index_to_label: dict[int, str],
  ) -> list[Metric]:

      ids = detailed_pairs[:, :5].astype(np.int32)

-     mask_matched = (
-         np.bitwise_and(
-             results, PairClassification.TP | PairClassification.FP_FN_MISCLF
-         )
-         > 0
-     )
-     mask_fp_unmatched = (
-         np.bitwise_and(results, PairClassification.FP_UNMATCHED) > 0
-     )
-     mask_fn_unmatched = (
-         np.bitwise_and(results, PairClassification.FN_UNMATCHED) > 0
-     )
+     mask_matched = mask_tp | mask_fp_fn_misclf

      return [
-         _unpack_confusion_matrix(
+         _unpack_confusion_matrix_with_examples(
+             metric=metric,
              ids=ids,
              mask_matched=mask_matched[iou_idx, score_idx],
              mask_fp_unmatched=mask_fp_unmatched[iou_idx, score_idx],
@@ -314,10 +390,7 @@ def unpack_confusion_matrix_into_metric_list(
              index_to_groundtruth_id=index_to_groundtruth_id,
              index_to_prediction_id=index_to_prediction_id,
              index_to_label=index_to_label,
-             iou_threhsold=iou_threshold,
-             score_threshold=score_threshold,
          )
-         for iou_idx, iou_threshold in enumerate(iou_thresholds)
-         for score_idx, score_threshold in enumerate(score_thresholds)
-         if (results[iou_idx, score_idx] != -1).any()
+         for iou_idx, inner in metrics.items()
+         for score_idx, metric in inner.items()
      ]
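
unpack_confusion_matrix_with_examples now consumes a nested {iou_idx: {score_idx: Metric}} dictionary rather than raw pair-classification codes. A sketch of how that argument might be pre-populated with create_empty_confusion_matrix_with_examples, assuming these helpers live in valor_lite/object_detection/utilities.py (the labels and thresholds are illustrative):

    from valor_lite.object_detection.utilities import (
        create_empty_confusion_matrix_with_examples,
    )

    index_to_label = {0: "cat", 1: "dog"}
    iou_thresholds = [0.5, 0.75]
    score_thresholds = [0.5]

    # One empty confusion-matrix Metric per (iou, score) pair, keyed by index.
    metrics = {
        iou_idx: {
            score_idx: create_empty_confusion_matrix_with_examples(
                iou_threhsold=iou_threshold,  # keyword spelled as in the source above
                score_threshold=score_threshold,
                index_to_label=index_to_label,
            )
            for score_idx, score_threshold in enumerate(score_thresholds)
        }
        for iou_idx, iou_threshold in enumerate(iou_thresholds)
    }
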
valor_lite/semantic_segmentation/__init__.py

@@ -1,14 +1,15 @@
  from .annotation import Bitmask, Segmentation
- from .manager import DataLoader, Evaluator, Filter, Metadata
+ from .evaluator import Builder, Evaluator, EvaluatorInfo
+ from .loader import Loader
  from .metric import Metric, MetricType

  __all__ = [
-     "DataLoader",
+     "Builder",
+     "Loader",
      "Evaluator",
      "Segmentation",
      "Bitmask",
      "Metric",
      "MetricType",
-     "Filter",
-     "Metadata",
+     "EvaluatorInfo",
  ]
valor_lite/semantic_segmentation/annotation.py

@@ -1,5 +1,6 @@
  import warnings
  from dataclasses import dataclass, field
+ from typing import Any

  import numpy as np
  from numpy.typing import NDArray
@@ -16,6 +17,8 @@ class Bitmask:
          A NumPy array of boolean values representing the mask.
      label : str
          The semantic label associated with the mask.
+     metadata : dict[str, Any], optional
+         A dictionary containing any metadata to be used within filtering operations.

      Examples
      --------
@@ -26,6 +29,7 @@ class Bitmask:

      mask: NDArray[np.bool_]
      label: str
+     metadata: dict[str, Any] | None = None

      def __post_init__(self):
          if self.mask.dtype != np.bool_:
@@ -51,6 +55,8 @@ class Segmentation:
          The shape of the segmentation masks. This is set automatically after initialization.
      size : int, optional
          The total number of pixels in the masks. This is set automatically after initialization.
+     metadata : dict[str, Any], optional
+         A dictionary containing any metadata to be used within filtering operations.

      Examples
      --------
@@ -71,6 +77,7 @@ class Segmentation:
      predictions: list[Bitmask]
      shape: tuple[int, ...]
      size: int = field(default=0)
+     metadata: dict[str, Any] | None = None

      def __post_init__(self):
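
The annotation hunks above add an optional metadata field to Bitmask and Segmentation for use in filtering. A short sketch constructing a Bitmask with the new field (the metadata key and value are illustrative):

    import numpy as np
    from valor_lite.semantic_segmentation import Bitmask

    mask = np.zeros((10, 10), dtype=np.bool_)
    mask[2:5, 2:5] = True
    tree = Bitmask(mask=mask, label="tree", metadata={"sensor": "rgb"})
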