valor-lite 0.33.11.tar.gz → 0.33.13.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

Files changed (80)
  1. {valor_lite-0.33.11/valor_lite.egg-info → valor_lite-0.33.13}/PKG-INFO +1 -1
  2. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/classification/test_accuracy.py +7 -90
  3. valor_lite-0.33.13/tests/object_detection/test_accuracy.py +492 -0
  4. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/object_detection/test_average_precision.py +1 -1
  5. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/object_detection/test_average_recall.py +1 -1
  6. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/object_detection/test_pr_curve.py +1 -1
  7. {valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite/classification/computation.py +2 -2
  8. {valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite/classification/manager.py +8 -6
  9. {valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite/classification/metric.py +29 -17
  10. {valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite/object_detection/computation.py +21 -17
  11. {valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite/object_detection/manager.py +11 -6
  12. {valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite/object_detection/metric.py +23 -10
  13. {valor_lite-0.33.11 → valor_lite-0.33.13/valor_lite.egg-info}/PKG-INFO +1 -1
  14. {valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite.egg-info/SOURCES.txt +1 -0
  15. {valor_lite-0.33.11 → valor_lite-0.33.13}/LICENSE +0 -0
  16. {valor_lite-0.33.11 → valor_lite-0.33.13}/README.md +0 -0
  17. {valor_lite-0.33.11 → valor_lite-0.33.13}/benchmarks/.gitignore +0 -0
  18. {valor_lite-0.33.11 → valor_lite-0.33.13}/benchmarks/benchmark_classification.py +0 -0
  19. {valor_lite-0.33.11 → valor_lite-0.33.13}/benchmarks/benchmark_objdet.py +0 -0
  20. {valor_lite-0.33.11 → valor_lite-0.33.13}/examples/.gitignore +0 -0
  21. {valor_lite-0.33.11 → valor_lite-0.33.13}/examples/object-detection.ipynb +0 -0
  22. {valor_lite-0.33.11 → valor_lite-0.33.13}/examples/tabular_classification.ipynb +0 -0
  23. {valor_lite-0.33.11 → valor_lite-0.33.13}/pyproject.toml +0 -0
  24. {valor_lite-0.33.11 → valor_lite-0.33.13}/setup.cfg +0 -0
  25. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/__init__.py +0 -0
  26. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/classification/__init__.py +0 -0
  27. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/classification/conftest.py +0 -0
  28. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/classification/test_confusion_matrix.py +0 -0
  29. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/classification/test_counts.py +0 -0
  30. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/classification/test_dataloader.py +0 -0
  31. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/classification/test_evaluator.py +0 -0
  32. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/classification/test_f1.py +0 -0
  33. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/classification/test_filtering.py +0 -0
  34. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/classification/test_precision.py +0 -0
  35. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/classification/test_recall.py +0 -0
  36. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/classification/test_rocauc.py +0 -0
  37. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/classification/test_schemas.py +0 -0
  38. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/classification/test_stability.py +0 -0
  39. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/object_detection/__init__.py +0 -0
  40. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/object_detection/conftest.py +0 -0
  41. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/object_detection/test_confusion_matrix.py +0 -0
  42. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/object_detection/test_counts.py +0 -0
  43. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/object_detection/test_dataloader.py +0 -0
  44. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/object_detection/test_evaluator.py +0 -0
  45. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/object_detection/test_filtering.py +0 -0
  46. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/object_detection/test_iou.py +0 -0
  47. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/object_detection/test_precision.py +0 -0
  48. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/object_detection/test_recall.py +0 -0
  49. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/object_detection/test_schemas.py +0 -0
  50. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/object_detection/test_stability.py +0 -0
  51. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/semantic_segmentation/__init__.py +0 -0
  52. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/semantic_segmentation/conftest.py +0 -0
  53. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/semantic_segmentation/test_accuracy.py +0 -0
  54. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/semantic_segmentation/test_annotation.py +0 -0
  55. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/semantic_segmentation/test_confusion_matrix.py +0 -0
  56. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/semantic_segmentation/test_dataloader.py +0 -0
  57. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/semantic_segmentation/test_evaluator.py +0 -0
  58. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/semantic_segmentation/test_f1.py +0 -0
  59. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/semantic_segmentation/test_filtering.py +0 -0
  60. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/semantic_segmentation/test_iou.py +0 -0
  61. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/semantic_segmentation/test_precision.py +0 -0
  62. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/semantic_segmentation/test_recall.py +0 -0
  63. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/semantic_segmentation/test_stability.py +0 -0
  64. {valor_lite-0.33.11 → valor_lite-0.33.13}/tests/text_generation/__init__.py +0 -0
  65. {valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite/LICENSE +0 -0
  66. {valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite/__init__.py +0 -0
  67. {valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite/classification/__init__.py +0 -0
  68. {valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite/classification/annotation.py +0 -0
  69. {valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite/object_detection/__init__.py +0 -0
  70. {valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite/object_detection/annotation.py +0 -0
  71. {valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite/schemas.py +0 -0
  72. {valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite/semantic_segmentation/__init__.py +0 -0
  73. {valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite/semantic_segmentation/annotation.py +0 -0
  74. {valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite/semantic_segmentation/computation.py +0 -0
  75. {valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite/semantic_segmentation/manager.py +0 -0
  76. {valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite/semantic_segmentation/metric.py +0 -0
  77. {valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite/text_generation/__init__.py +0 -0
  78. {valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite.egg-info/dependency_links.txt +0 -0
  79. {valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite.egg-info/requires.txt +0 -0
  80. {valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite.egg-info/top_level.txt +0 -0
{valor_lite-0.33.11/valor_lite.egg-info → valor_lite-0.33.13}/PKG-INFO

@@ -1,6 +1,6 @@
  Metadata-Version: 2.1
  Name: valor-lite
- Version: 0.33.11
+ Version: 0.33.13
  Summary: Compute valor metrics locally.
  License: MIT License

{valor_lite-0.33.11 → valor_lite-0.33.13}/tests/classification/test_accuracy.py

@@ -53,18 +53,12 @@ def test_accuracy_computation():
  )

  # score threshold, label, count metric
- assert accuracy.shape == (2, 4)
+ assert accuracy.shape == (2,)

  # score >= 0.25
- assert accuracy[0][0] == 2 / 3
- assert accuracy[0][1] == 1.0
- assert accuracy[0][2] == 2 / 3
- assert accuracy[0][3] == 1.0
+ assert accuracy[0] == 2 / 3
  # score >= 0.75
- assert accuracy[1][0] == 2 / 3
- assert accuracy[1][1] == 1.0
- assert accuracy[1][2] == 2 / 3
- assert accuracy[1][3] == 2 / 3
+ assert accuracy[1] == 1 / 3


  def test_accuracy_basic(basic_classifications: list[Classification]):
@@ -87,20 +81,10 @@ def test_accuracy_basic(basic_classifications: list[Classification]):
  expected_metrics = [
  {
  "type": "Accuracy",
- "value": [2 / 3, 2 / 3],
+ "value": [2 / 3, 1 / 3],
  "parameters": {
  "score_thresholds": [0.25, 0.75],
  "hardmax": True,
- "label": "0",
- },
- },
- {
- "type": "Accuracy",
- "value": [1.0, 2 / 3],
- "parameters": {
- "score_thresholds": [0.25, 0.75],
- "hardmax": True,
- "label": "3",
  },
  },
  ]
@@ -124,29 +108,10 @@ def test_accuracy_with_animal_example(
  expected_metrics = [
  {
  "type": "Accuracy",
- "value": [2.0 / 3.0],
- "parameters": {
- "score_thresholds": [0.5],
- "hardmax": True,
- "label": "bird",
- },
- },
- {
- "type": "Accuracy",
- "value": [0.5],
+ "value": [2.0 / 6.0],
  "parameters": {
  "score_thresholds": [0.5],
  "hardmax": True,
- "label": "dog",
- },
- },
- {
- "type": "Accuracy",
- "value": [2 / 3],
- "parameters": {
- "score_thresholds": [0.5],
- "hardmax": True,
- "label": "cat",
  },
  },
  ]
@@ -170,38 +135,10 @@ def test_accuracy_color_example(
  expected_metrics = [
  {
  "type": "Accuracy",
- "value": [2 / 3],
- "parameters": {
- "score_thresholds": [0.5],
- "hardmax": True,
- "label": "white",
- },
- },
- {
- "type": "Accuracy",
- "value": [2 / 3],
+ "value": [2 / 6],
  "parameters": {
  "score_thresholds": [0.5],
  "hardmax": True,
- "label": "red",
- },
- },
- {
- "type": "Accuracy",
- "value": [2 / 3],
- "parameters": {
- "score_thresholds": [0.5],
- "hardmax": True,
- "label": "blue",
- },
- },
- {
- "type": "Accuracy",
- "value": [5 / 6],
- "parameters": {
- "score_thresholds": [0.5],
- "hardmax": True,
- "label": "black",
  },
  },
  ]
@@ -237,7 +174,6 @@ def test_accuracy_with_image_example(
  "parameters": {
  "score_thresholds": [0.0],
  "hardmax": True,
- "label": "v4",
  },
  },
  ]
@@ -269,29 +205,10 @@ def test_accuracy_with_tabular_example(
  expected_metrics = [
  {
  "type": "Accuracy",
- "value": [0.7],
- "parameters": {
- "score_thresholds": [0.0],
- "hardmax": True,
- "label": "0",
- },
- },
- {
- "type": "Accuracy",
- "value": [0.5],
- "parameters": {
- "score_thresholds": [0.0],
- "hardmax": True,
- "label": "1",
- },
- },
- {
- "type": "Accuracy",
- "value": [0.8],
+ "value": [5 / 10],
  "parameters": {
  "score_thresholds": [0.0],
  "hardmax": True,
- "label": "2",
  },
  },
  ]
valor_lite-0.33.13/tests/object_detection/test_accuracy.py

@@ -0,0 +1,492 @@
+ import numpy as np
+ from valor_lite.object_detection import DataLoader, Detection, MetricType
+ from valor_lite.object_detection.computation import compute_metrics
+
+
+ def test__compute_average_precision():
+
+ sorted_pairs = np.array(
+ [
+ # dt, gt, pd, iou, gl, pl, score,
+ [0.0, 0.0, 2.0, 0.25, 0.0, 0.0, 0.95],
+ [0.0, 0.0, 3.0, 0.33333, 0.0, 0.0, 0.9],
+ [0.0, 0.0, 4.0, 0.66667, 0.0, 0.0, 0.65],
+ [0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.1],
+ [0.0, 0.0, 1.0, 0.5, 0.0, 0.0, 0.01],
+ ]
+ )
+
+ label_metadata = np.array([[1, 5, 0]])
+ iou_thresholds = np.array([0.1, 0.6])
+ score_thresholds = np.array([0.0])
+
+ (_, _, accuracy, _, _) = compute_metrics(
+ sorted_pairs,
+ label_metadata=label_metadata,
+ iou_thresholds=iou_thresholds,
+ score_thresholds=score_thresholds,
+ )
+
+ expected = np.array(
+ [
+ [0.2], # iou = 0.1
+ [0.2], # iou = 0.6
+ ]
+ )
+ assert (accuracy == expected).all()
+
+
+ def test_ap_using_torch_metrics_example(
+ torchmetrics_detections: list[Detection],
+ ):
+ """
+ cf with torch metrics/pycocotools results listed here:
+ https://github.com/Lightning-AI/metrics/blob/107dbfd5fb158b7ae6d76281df44bd94c836bfce/tests/unittests/detection/test_map.py#L231
+ """
+
+ loader = DataLoader()
+ loader.add_bounding_boxes(torchmetrics_detections)
+ evaluator = loader.finalize()
+
+ assert evaluator.ignored_prediction_labels == ["3"]
+ assert evaluator.missing_prediction_labels == []
+ assert evaluator.n_datums == 4
+ assert evaluator.n_labels == 6
+ assert evaluator.n_groundtruths == 20
+ assert evaluator.n_predictions == 19
+
+ metrics = evaluator.evaluate(
+ iou_thresholds=[0.5, 0.75],
+ as_dict=True,
+ )
+
+ # test Accuracy
+ actual_metrics = [m for m in metrics[MetricType.Accuracy]]
+ expected_metrics = [
+ {
+ "type": "Accuracy",
+ "value": 9 / 19,
+ "parameters": {
+ "iou_threshold": 0.5,
+ "score_threshold": 0.5,
+ },
+ },
+ {
+ "type": "Accuracy",
+ "value": 8 / 19,
+ "parameters": {
+ "iou_threshold": 0.75,
+ "score_threshold": 0.5,
+ },
+ },
+ ]
+ for m in actual_metrics:
+ assert m in expected_metrics
+ for m in expected_metrics:
+ assert m in actual_metrics
+
+
+ def test_accuracy_metrics_first_class(
+ basic_detections_first_class: list[Detection],
+ basic_rotated_detections_first_class: list[Detection],
+ ):
+ """
+ Basic object detection test.
+
+ groundtruths
+ datum uid1
+ box 1 - label v1 - tp
+ box 3 - label v2 - fn missing prediction
+ datum uid2
+ box 2 - label v1 - fn missing prediction
+
+ predictions
+ datum uid1
+ box 1 - label v1 - score 0.3 - tp
+ datum uid2
+ box 2 - label v2 - score 0.98 - fp
+ """
+ for input_, method in [
+ (basic_detections_first_class, DataLoader.add_bounding_boxes),
+ (basic_rotated_detections_first_class, DataLoader.add_polygons),
+ ]:
+ loader = DataLoader()
+ method(loader, input_)
+ evaluator = loader.finalize()
+
+ metrics = evaluator.evaluate(
+ iou_thresholds=[0.1, 0.6],
+ score_thresholds=[0.0, 0.5],
+ as_dict=True,
+ )
+
+ assert evaluator.ignored_prediction_labels == []
+ assert evaluator.missing_prediction_labels == []
+ assert evaluator.n_datums == 2
+ assert evaluator.n_labels == 1
+ assert evaluator.n_groundtruths == 2
+ assert evaluator.n_predictions == 1
+
+ # test Accuracy
+ actual_metrics = [m for m in metrics[MetricType.Accuracy]]
+ expected_metrics = [
+ {
+ "type": "Accuracy",
+ "value": 1.0,
+ "parameters": {
+ "iou_threshold": 0.1,
+ "score_threshold": 0.0,
+ },
+ },
+ {
+ "type": "Accuracy",
+ "value": 1.0,
+ "parameters": {
+ "iou_threshold": 0.6,
+ "score_threshold": 0.0,
+ },
+ },
+ {
+ "type": "Accuracy",
+ "value": 0.0,
+ "parameters": {
+ "iou_threshold": 0.1,
+ "score_threshold": 0.5,
+ },
+ },
+ {
+ "type": "Accuracy",
+ "value": 0.0,
+ "parameters": {
+ "iou_threshold": 0.6,
+ "score_threshold": 0.5,
+ },
+ },
+ ]
+ for m in actual_metrics:
+ assert m in expected_metrics
+ for m in expected_metrics:
+ assert m in actual_metrics
+
+
+ def test_accuracy_metrics_second_class(
+ basic_detections_second_class: list[Detection],
+ basic_rotated_detections_second_class: list[Detection],
+ ):
+ """
+ Basic object detection test.
+
+ groundtruths
+ datum uid1
+ box 3 - label v2 - fn missing prediction
+ datum uid2
+ none
+ predictions
+ datum uid1
+ none
+ datum uid2
+ box 2 - label v2 - score 0.98 - fp
+ """
+ for input_, method in [
+ (basic_detections_second_class, DataLoader.add_bounding_boxes),
+ (basic_rotated_detections_second_class, DataLoader.add_polygons),
+ ]:
+ loader = DataLoader()
+ method(loader, input_)
+ evaluator = loader.finalize()
+
+ metrics = evaluator.evaluate(
+ iou_thresholds=[0.1, 0.6],
+ score_thresholds=[0.0, 0.5],
+ as_dict=True,
+ )
+
+ assert evaluator.ignored_prediction_labels == []
+ assert evaluator.missing_prediction_labels == []
+ assert evaluator.n_datums == 2
+ assert evaluator.n_labels == 1
+ assert evaluator.n_groundtruths == 1
+ assert evaluator.n_predictions == 1
+
+ # test Accuracy
+ actual_metrics = [m for m in metrics[MetricType.Accuracy]]
+ expected_metrics = [
+ {
+ "type": "Accuracy",
+ "value": 0.0,
+ "parameters": {
+ "iou_threshold": 0.1,
+ "score_threshold": 0.0,
+ },
+ },
+ {
+ "type": "Accuracy",
+ "value": 0.0,
+ "parameters": {
+ "iou_threshold": 0.6,
+ "score_threshold": 0.0,
+ },
+ },
+ {
+ "type": "Accuracy",
+ "value": 0.0,
+ "parameters": {
+ "iou_threshold": 0.1,
+ "score_threshold": 0.5,
+ },
+ },
+ {
+ "type": "Accuracy",
+ "value": 0.0,
+ "parameters": {
+ "iou_threshold": 0.6,
+ "score_threshold": 0.5,
+ },
+ },
+ ]
+ for m in actual_metrics:
+ assert m in expected_metrics
+ for m in expected_metrics:
+ assert m in actual_metrics
+
+
+ def test_accuracy_false_negatives_single_datum_baseline(
+ false_negatives_single_datum_baseline_detections: list[Detection],
+ ):
+ """This is the baseline for the below test. In this case there are two predictions and
+ one groundtruth, but the highest confident prediction overlaps sufficiently with the groundtruth
+ so there is not a penalty for the false negative so the Accuracy is 1
+ """
+
+ loader = DataLoader()
+ loader.add_bounding_boxes(false_negatives_single_datum_baseline_detections)
+ evaluator = loader.finalize()
+
+ metrics = evaluator.evaluate(
+ iou_thresholds=[0.5],
+ score_thresholds=[0.0, 0.9],
+ as_dict=True,
+ )
+
+ actual_metrics = [m for m in metrics[MetricType.Accuracy]]
+ expected_metrics = [
+ {
+ "type": "Accuracy",
+ "value": 0.5,
+ "parameters": {
+ "iou_threshold": 0.5,
+ "score_threshold": 0.0,
+ },
+ },
+ {
+ "type": "Accuracy",
+ "value": 0.0,
+ "parameters": {
+ "iou_threshold": 0.5,
+ "score_threshold": 0.9,
+ },
+ },
+ ]
+ for m in actual_metrics:
+ assert m in expected_metrics
+ for m in expected_metrics:
+ assert m in actual_metrics
+
+
+ def test_accuracy_false_negatives_single_datum(
+ false_negatives_single_datum_detections: list[Detection],
+ ):
+ """Tests where high confidence false negative was not being penalized. The
+ difference between this test and the above is that here the prediction with higher confidence
+ does not sufficiently overlap the groundtruth and so is penalized and we get an Accuracy of 0.5
+ """
+
+ loader = DataLoader()
+ loader.add_bounding_boxes(false_negatives_single_datum_detections)
+ evaluator = loader.finalize()
+ metrics = evaluator.evaluate(
+ iou_thresholds=[0.5],
+ score_thresholds=[0.0],
+ as_dict=True,
+ )
+
+ actual_metrics = [m for m in metrics[MetricType.Accuracy]]
+ expected_metrics = [
+ {
+ "type": "Accuracy",
+ "value": 0.5,
+ "parameters": {
+ "iou_threshold": 0.5,
+ "score_threshold": 0.0,
+ },
+ }
+ ]
+ for m in actual_metrics:
+ assert m in expected_metrics
+ for m in expected_metrics:
+ assert m in actual_metrics
+
+
+ def test_accuracy_false_negatives_two_datums_one_empty_low_confidence_of_fp(
+ false_negatives_two_datums_one_empty_low_confidence_of_fp_detections: list[
+ Detection
+ ],
+ ):
+ """In this test we have
+ 1. An image with a matching groundtruth and prediction (same class and high IOU)
+ 2. A second image with empty groundtruth annotation but a prediction with lower confidence
+ then the prediction on the first image.
+
+ In this case, the Accuracy should be 1.0 since the false positive has lower confidence than the true positive
+
+ """
+
+ loader = DataLoader()
+ loader.add_bounding_boxes(
+ false_negatives_two_datums_one_empty_low_confidence_of_fp_detections
+ )
+ evaluator = loader.finalize()
+ metrics = evaluator.evaluate(
+ iou_thresholds=[0.5],
+ score_thresholds=[0.0],
+ as_dict=True,
+ )
+
+ actual_metrics = [m for m in metrics[MetricType.Accuracy]]
+ expected_metrics = [
+ {
+ "type": "Accuracy",
+ "value": 0.5,
+ "parameters": {
+ "iou_threshold": 0.5,
+ "score_threshold": 0.0,
+ },
+ }
+ ]
+ for m in actual_metrics:
+ assert m in expected_metrics
+ for m in expected_metrics:
+ assert m in actual_metrics
+
+
+ def test_accuracy_false_negatives_two_datums_one_empty_high_confidence_of_fp(
+ false_negatives_two_datums_one_empty_high_confidence_of_fp_detections: list[
+ Detection
+ ],
+ ):
+ """In this test we have
+ 1. An image with a matching groundtruth and prediction (same class and high IOU)
+ 2. A second image with empty groundtruth annotation and a prediction with higher confidence
+ then the prediction on the first image.
+
+ In this case, the Accuracy should be 0.5 since the false positive has higher confidence than the true positive
+ """
+
+ loader = DataLoader()
+ loader.add_bounding_boxes(
+ false_negatives_two_datums_one_empty_high_confidence_of_fp_detections
+ )
+ evaluator = loader.finalize()
+ metrics = evaluator.evaluate(
+ iou_thresholds=[0.5],
+ score_thresholds=[0.0],
+ as_dict=True,
+ )
+
+ actual_metrics = [m for m in metrics[MetricType.Accuracy]]
+ expected_metrics = [
+ {
+ "type": "Accuracy",
+ "value": 0.5,
+ "parameters": {
+ "iou_threshold": 0.5,
+ "score_threshold": 0.0,
+ },
+ }
+ ]
+ for m in actual_metrics:
+ assert m in expected_metrics
+ for m in expected_metrics:
+ assert m in actual_metrics
+
+
+ def test_accuracy_false_negatives_two_datums_one_only_with_different_class_low_confidence_of_fp(
+ false_negatives_two_datums_one_only_with_different_class_low_confidence_of_fp_detections: list[
+ Detection
+ ],
+ ):
+ """In this test we have
+ 1. An image with a matching groundtruth and prediction (same class, `"value"`, and high IOU)
+ 2. A second image with a groundtruth annotation with class `"other value"` and a prediction with lower confidence
+ then the prediction on the first image.
+
+ In this case, the Accuracy for class `"value"` should be 1 since the false positive has lower confidence than the true positive.
+ Accuracy for class `"other value"` should be 0 since there is no prediction for the `"other value"` groundtruth
+ """
+ loader = DataLoader()
+ loader.add_bounding_boxes(
+ false_negatives_two_datums_one_only_with_different_class_low_confidence_of_fp_detections
+ )
+ evaluator = loader.finalize()
+ metrics = evaluator.evaluate(
+ iou_thresholds=[0.5],
+ score_thresholds=[0.0],
+ as_dict=True,
+ )
+
+ actual_metrics = [m for m in metrics[MetricType.Accuracy]]
+ expected_metrics = [
+ {
+ "type": "Accuracy",
+ "value": 0.5,
+ "parameters": {
+ "iou_threshold": 0.5,
+ "score_threshold": 0.0,
+ },
+ },
+ ]
+ for m in actual_metrics:
+ assert m in expected_metrics
+ for m in expected_metrics:
+ assert m in actual_metrics
+
+
+ def test_accuracy_false_negatives_two_datums_one_only_with_different_class_high_confidence_of_fp(
+ false_negatives_two_images_one_only_with_different_class_high_confidence_of_fp_detections: list[
+ Detection
+ ],
+ ):
+ """In this test we have
+ 1. An image with a matching groundtruth and prediction (same class, `"value"`, and high IOU)
+ 2. A second image with a groundtruth annotation with class `"other value"` and a prediction with higher confidence
+ then the prediction on the first image.
+
+ In this case, the Accuracy for class `"value"` should be 0.5 since the false positive has higher confidence than the true positive.
+ Accuracy for class `"other value"` should be 0 since there is no prediction for the `"other value"` groundtruth
+ """
+ loader = DataLoader()
+ loader.add_bounding_boxes(
+ false_negatives_two_images_one_only_with_different_class_high_confidence_of_fp_detections
+ )
+ evaluator = loader.finalize()
+ metrics = evaluator.evaluate(
+ iou_thresholds=[0.5],
+ score_thresholds=[0.0],
+ as_dict=True,
+ )
+
+ actual_metrics = [m for m in metrics[MetricType.Accuracy]]
+ expected_metrics = [
+ {
+ "type": "Accuracy",
+ "value": 0.5,
+ "parameters": {
+ "iou_threshold": 0.5,
+ "score_threshold": 0.0,
+ },
+ },
+ ]
+ for m in actual_metrics:
+ assert m in expected_metrics
+ for m in expected_metrics:
+ assert m in actual_metrics
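A quick worked check of the headline expectations in test_ap_using_torch_metrics_example, assuming the aggregate definition introduced in valor_lite/object_detection/computation.py further below (true positives divided by the total number of predictions); the 19 comes from the fixture's evaluator.n_predictions assertion:

    # Hedged arithmetic check only; the counts 9 and 8 are read off the expected values.
    n_predictions = 19  # evaluator.n_predictions in the torchmetrics fixture
    print(9 / n_predictions)  # 0.4736... -> "value": 9 / 19 at iou_threshold 0.5
    print(8 / n_predictions)  # 0.4210... -> "value": 8 / 19 at iou_threshold 0.75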
{valor_lite-0.33.11 → valor_lite-0.33.13}/tests/object_detection/test_average_precision.py

@@ -24,7 +24,7 @@ def test__compute_average_precision():
  iou_thresholds = np.array([0.1, 0.6])
  score_thresholds = np.array([0.0])

- (results, _, _, _,) = compute_metrics(
+ (results, _, _, _, _) = compute_metrics(
  sorted_pairs,
  label_metadata=label_metadata,
  iou_thresholds=iou_thresholds,
{valor_lite-0.33.11 → valor_lite-0.33.13}/tests/object_detection/test_average_recall.py

@@ -25,7 +25,7 @@ def test__compute_average_recall():
  iou_thresholds = np.array([0.1, 0.6])
  score_thresholds = np.array([0.5, 0.93, 0.98])

- (_, results, _, _,) = compute_metrics(
+ (_, results, _, _, _,) = compute_metrics(
  sorted_pairs,
  label_metadata=label_metadata,
  iou_thresholds=iou_thresholds,
{valor_lite-0.33.11 → valor_lite-0.33.13}/tests/object_detection/test_pr_curve.py

@@ -24,7 +24,7 @@ def test_pr_curve_simple():
  iou_thresholds = np.array([0.1, 0.6])
  score_thresholds = np.array([0.0])

- (_, _, _, pr_curve) = compute_metrics(
+ (_, _, _, _, pr_curve) = compute_metrics(
  sorted_pairs,
  label_metadata=label_metadata,
  iou_thresholds=iou_thresholds,
{valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite/classification/computation.py

@@ -182,9 +182,9 @@ def compute_metrics(
  out=precision,
  )

- accuracy = np.zeros_like(recall)
+ accuracy = np.zeros(n_scores, dtype=np.float64)
  np.divide(
- (counts[:, :, 0] + counts[:, :, 3]),
+ counts[:, :, 0].sum(axis=1),
  float(n_datums),
  out=accuracy,
  )
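The replaced lines above change classification accuracy from a per-label ratio into a single aggregate value per score threshold: correct hardmax predictions summed over all labels, divided by the number of datums. A minimal NumPy sketch of that reduction, using made-up counts; the (TP, FP, FN, TN) column ordering is inferred from the old expression and is an assumption:

    import numpy as np

    # Made-up hardmax confusion counts: 2 score thresholds x 3 labels,
    # last axis assumed to be (TP, FP, FN, TN), with TP in column 0 as the diff uses.
    counts = np.array(
        [
            [[1, 0, 0, 2], [1, 1, 0, 1], [0, 0, 1, 2]],  # score >= 0.25
            [[1, 0, 0, 2], [0, 1, 1, 1], [0, 1, 1, 1]],  # score >= 0.75
        ],
        dtype=np.float64,
    )
    n_datums = 3

    # Old behaviour: one accuracy per (score threshold, label) -> shape (2, 3).
    per_label = (counts[:, :, 0] + counts[:, :, 3]) / float(n_datums)

    # New behaviour: one accuracy per score threshold, TP summed over labels -> shape (2,).
    accuracy = np.zeros(counts.shape[0], dtype=np.float64)
    np.divide(counts[:, :, 0].sum(axis=1), float(n_datums), out=accuracy)
    print(accuracy)  # approx. [0.667 0.333], the shape (2,) the updated test now asserts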
{valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite/classification/manager.py

@@ -367,6 +367,14 @@ class Evaluator:
  )
  ]

+ metrics[MetricType.Accuracy] = [
+ Accuracy(
+ value=accuracy.astype(float).tolist(),
+ score_thresholds=score_thresholds,
+ hardmax=hardmax,
+ )
+ ]
+
  for label_idx, label in self.index_to_label.items():

  kwargs = {
@@ -401,12 +409,6 @@ class Evaluator:
  **kwargs,
  )
  )
- metrics[MetricType.Accuracy].append(
- Accuracy(
- value=accuracy[:, label_idx].astype(float).tolist(),
- **kwargs,
- )
- )
  metrics[MetricType.F1].append(
  F1(
  value=f1_score[:, label_idx].astype(float).tolist(),
{valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite/classification/metric.py

@@ -158,24 +158,23 @@ class Recall(_ThresholdValue):
  pass


- class Accuracy(_ThresholdValue):
+ class F1(_ThresholdValue):
  """
- Accuracy metric for a specific class label.
+ F1 score for a specific class label.

- This class calculates the accuracy at various score thresholds for a binary
- classification task. Accuracy is defined as the ratio of the sum of true positives and
- true negatives over all predictions.
+ This class calculates the F1 score at various score thresholds for a binary
+ classification task.

  Attributes
  ----------
  value : list[float]
- Accuracy values computed at each score threshold.
+ F1 scores computed at each score threshold.
  score_thresholds : list[float]
- Score thresholds at which the accuracy values are computed.
+ Score thresholds at which the F1 scores are computed.
  hardmax : bool
  Indicates whether hardmax thresholding was used.
  label : str
- The class label for which the accuracy is computed.
+ The class label for which the F1 score is computed.

  Methods
  -------
@@ -188,23 +187,21 @@ class Accuracy(_ThresholdValue):
  pass


- class F1(_ThresholdValue):
+ @dataclass
+ class Accuracy:
  """
- F1 score for a specific class label.
+ Multiclass accuracy metric.

- This class calculates the F1 score at various score thresholds for a binary
- classification task.
+ This class calculates the accuracy at various score thresholds.

  Attributes
  ----------
  value : list[float]
- F1 scores computed at each score threshold.
+ Accuracy values computed at each score threshold.
  score_thresholds : list[float]
- Score thresholds at which the F1 scores are computed.
+ Score thresholds at which the accuracy values are computed.
  hardmax : bool
  Indicates whether hardmax thresholding was used.
- label : str
- The class label for which the F1 score is computed.

  Methods
  -------
@@ -214,7 +211,22 @@ class F1(_ThresholdValue):
  Converts the instance to a dictionary representation.
  """

- pass
+ value: list[float]
+ score_thresholds: list[float]
+ hardmax: bool
+
+ def to_metric(self) -> Metric:
+ return Metric(
+ type=type(self).__name__,
+ value=self.value,
+ parameters={
+ "score_thresholds": self.score_thresholds,
+ "hardmax": self.hardmax,
+ },
+ )
+
+ def to_dict(self) -> dict:
+ return self.to_metric().to_dict()


  @dataclass
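After this change the classification Accuracy metric serializes without a per-label parameter. A hedged, self-contained mirror of the new dataclass (the real implementation goes through valor_lite's Metric type; only the resulting dictionary shape is reproduced here, and the class name is hypothetical):

    from dataclasses import dataclass

    # Standalone mirror of the reshaped classification Accuracy shown above.
    @dataclass
    class AccuracySketch:
        value: list[float]
        score_thresholds: list[float]
        hardmax: bool

        def to_dict(self) -> dict:
            return {
                "type": "Accuracy",
                "value": self.value,
                "parameters": {
                    "score_thresholds": self.score_thresholds,
                    "hardmax": self.hardmax,
                },
            }

    print(AccuracySketch([2 / 3, 1 / 3], [0.25, 0.75], True).to_dict())
    # Matches the single expected metric in test_accuracy_basic above: no "label" key.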
{valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite/object_detection/computation.py

@@ -282,6 +282,7 @@ def compute_metrics(
  ],
  NDArray[np.float64],
  NDArray[np.float64],
+ NDArray[np.float64],
  ]:
  """
  Computes Object Detection metrics.
@@ -309,13 +310,15 @@ def compute_metrics(

  Returns
  -------
- tuple[NDArray, NDArray, NDArray, float]
+ tuple[NDArray[np.float64], NDArray[np.float64], NDArray[np.float64], float]
  Average Precision results.
- tuple[NDArray, NDArray, NDArray, float]
+ tuple[NDArray[np.float64], NDArray[np.float64], NDArray[np.float64], float]
  Average Recall results.
- np.ndarray
- Precision, Recall, TP, FP, FN, F1 Score, Accuracy.
- np.ndarray
+ NDArray[np.float64]
+ Accuracy.
+ NDArray[np.float64]
+ Precision, Recall, TP, FP, FN, F1 Score.
+ NDArray[np.float64]
  Interpolated Precision-Recall Curves.
  """

@@ -329,9 +332,10 @@ def compute_metrics(
  elif n_scores == 0:
  raise ValueError("At least one score threshold must be passed.")

- average_precision = np.zeros((n_ious, n_labels))
- average_recall = np.zeros((n_scores, n_labels))
- counts = np.zeros((n_ious, n_scores, n_labels, 7))
+ average_precision = np.zeros((n_ious, n_labels), dtype=np.float64)
+ average_recall = np.zeros((n_scores, n_labels), dtype=np.float64)
+ accuracy = np.zeros((n_ious, n_scores), dtype=np.float64)
+ counts = np.zeros((n_ious, n_scores, n_labels, 6), dtype=np.float64)

  pd_labels = data[:, 5].astype(np.int32)
  scores = data[:, 6]
@@ -417,14 +421,6 @@ def compute_metrics(
  out=f1_score,
  )

- accuracy = np.zeros_like(tp_count)
- np.divide(
- tp_count,
- (gt_count + pd_count),
- where=(gt_count + pd_count) > 1e-9,
- out=accuracy,
- )
-
  counts[iou_idx][score_idx] = np.concatenate(
  (
  tp_count[:, np.newaxis],
@@ -433,11 +429,18 @@
  precision[:, np.newaxis],
  recall[:, np.newaxis],
  f1_score[:, np.newaxis],
- accuracy[:, np.newaxis],
  ),
  axis=1,
  )

+ # caluculate accuracy
+ total_pd_count = label_metadata[:, 1].sum()
+ accuracy[iou_idx, score_idx] = (
+ (tp_count.sum() / total_pd_count)
+ if total_pd_count > 1e-9
+ else 0.0
+ )
+
  # calculate recall for AR
  average_recall[score_idx] += recall

@@ -552,6 +555,7 @@ def compute_metrics(
  return (
  ap_results,
  ar_results,
+ accuracy,
  counts,
  pr_curve,
  )
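The hunks above drop the per-label accuracy column (TP / (GT + PD)) from counts and instead fill one accuracy value per (IoU threshold, score threshold) pair: summed true positives over the total prediction count taken from label_metadata[:, 1]. A rough standalone sketch of that reduction, with illustrative array values rather than the library's internal layout:

    import numpy as np

    # Illustrative only: tp_counts holds per-label true-positive counts for
    # 2 IoU thresholds x 1 score threshold x 3 labels; label_metadata column 1
    # holds the number of predictions per label (values chosen so the totals
    # echo the torchmetrics test above).
    tp_counts = np.array([[[5.0, 3.0, 1.0]], [[4.0, 3.0, 1.0]]])
    label_metadata = np.array([[10, 8, 0], [6, 7, 0], [4, 4, 0]])

    n_ious, n_scores, _ = tp_counts.shape
    accuracy = np.zeros((n_ious, n_scores), dtype=np.float64)
    total_pd_count = label_metadata[:, 1].sum()  # 19 predictions overall

    for iou_idx in range(n_ious):
        for score_idx in range(n_scores):
            tp_count = tp_counts[iou_idx, score_idx]
            accuracy[iou_idx, score_idx] = (
                (tp_count.sum() / total_pd_count) if total_pd_count > 1e-9 else 0.0
            )

    print(accuracy)  # [[9/19], [8/19]]: one value per (iou_threshold, score_threshold)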
{valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite/object_detection/manager.py

@@ -506,6 +506,7 @@ class Evaluator:
  average_recall_averaged_over_scores,
  mean_average_recall_averaged_over_scores,
  ),
+ accuracy,
  precision_recall,
  pr_curves,
  ) = compute_metrics(
@@ -593,6 +594,16 @@ class Evaluator:
  )
  ]

+ metrics[MetricType.Accuracy] = [
+ Accuracy(
+ value=float(accuracy[iou_idx, score_idx]),
+ iou_threshold=iou_thresholds[iou_idx],
+ score_threshold=score_thresholds[score_idx],
+ )
+ for iou_idx in range(accuracy.shape[0])
+ for score_idx in range(accuracy.shape[1])
+ ]
+
  metrics[MetricType.PrecisionRecallCurve] = [
  PrecisionRecallCurve(
  precisions=pr_curves[iou_idx, label_idx, :, 0]
@@ -650,12 +661,6 @@ class Evaluator:
  **kwargs,
  )
  )
- metrics[MetricType.Accuracy].append(
- Accuracy(
- value=float(row[6]),
- **kwargs,
- )
- )

  if as_dict:
  return {
{valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite/object_detection/metric.py

@@ -160,9 +160,9 @@ class Recall(_ClassMetric):
  pass


- class Accuracy(_ClassMetric):
+ class F1(_ClassMetric):
  """
- Accuracy metric for a specific class label in object detection.
+ F1 score for a specific class label in object detection.

  This class encapsulates a metric value for a particular class label,
  along with the associated Intersection over Union (IoU) threshold and
@@ -190,20 +190,18 @@ class Accuracy(_ClassMetric):
  pass


- class F1(_ClassMetric):
+ @dataclass
+ class Accuracy:
  """
- F1 score for a specific class label in object detection.
+ Accuracy metric for the object detection task type.

- This class encapsulates a metric value for a particular class label,
- along with the associated Intersection over Union (IoU) threshold and
- confidence score threshold.
+ This class encapsulates a metric value at a specific Intersection
+ over Union (IoU) threshold and confidence score threshold.

  Attributes
  ----------
  value : float
  The metric value.
- label : str
- The class label for which the metric is calculated.
  iou_threshold : float
  The IoU threshold used to determine matches between predicted and ground truth boxes.
  score_threshold : float
@@ -217,7 +215,22 @@ class F1(_ClassMetric):
  Converts the instance to a dictionary representation.
  """

- pass
+ value: float
+ iou_threshold: float
+ score_threshold: float
+
+ def to_metric(self) -> Metric:
+ return Metric(
+ type=type(self).__name__,
+ value=self.value,
+ parameters={
+ "iou_threshold": self.iou_threshold,
+ "score_threshold": self.score_threshold,
+ },
+ )
+
+ def to_dict(self) -> dict:
+ return self.to_metric().to_dict()


  @dataclass
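Likewise, the detection-level Accuracy now carries only an IoU threshold and a score threshold. A minimal mirror of the dictionary it produces (hypothetical class name; the real class delegates to Metric):

    from dataclasses import dataclass

    # Standalone mirror of the detection Accuracy shown above; dict shape only.
    @dataclass
    class DetectionAccuracySketch:
        value: float
        iou_threshold: float
        score_threshold: float

        def to_dict(self) -> dict:
            return {
                "type": "Accuracy",
                "value": self.value,
                "parameters": {
                    "iou_threshold": self.iou_threshold,
                    "score_threshold": self.score_threshold,
                },
            }

    print(DetectionAccuracySketch(9 / 19, 0.5, 0.5).to_dict())
    # Same structure as the expected metrics in the new test_accuracy.py above.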
{valor_lite-0.33.11 → valor_lite-0.33.13/valor_lite.egg-info}/PKG-INFO

@@ -1,6 +1,6 @@
  Metadata-Version: 2.1
  Name: valor-lite
- Version: 0.33.11
+ Version: 0.33.13
  Summary: Compute valor metrics locally.
  License: MIT License

{valor_lite-0.33.11 → valor_lite-0.33.13}/valor_lite.egg-info/SOURCES.txt

@@ -24,6 +24,7 @@ tests/classification/test_schemas.py
  tests/classification/test_stability.py
  tests/object_detection/__init__.py
  tests/object_detection/conftest.py
+ tests/object_detection/test_accuracy.py
  tests/object_detection/test_average_precision.py
  tests/object_detection/test_average_recall.py
  tests/object_detection/test_confusion_matrix.py