[Validate] add warning for unspecified arguments, and change default values #277

Open · wants to merge 3 commits into base: master
Changes from 2 commits
10 changes: 10 additions & 0 deletions nucleus/metrics/base.py
@@ -11,6 +11,8 @@
)
from nucleus.prediction import PredictionList

EPSILON = 10 ** -4 # 0.0001


class MetricResult(ABC):
"""Base MetricResult class"""
@@ -41,6 +43,14 @@ def aggregate(results: Iterable["ScalarResult"]) -> "ScalarResult":
value = total_value / max(total_weight, sys.float_info.epsilon)
return ScalarResult(value, total_weight)

def __eq__(self, other):
if not isinstance(other, self.__class__):
return False
return (
abs(self.value - other.value) < EPSILON
and self.weight == other.weight
)
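For illustration (editorial note, hypothetical values): two results whose values differ by less than EPSILON compare equal, while weights are still compared exactly:

a = ScalarResult(0.50003, 2.0)
b = ScalarResult(0.50001, 2.0)
assert a == b                            # |0.50003 - 0.50001| < EPSILON
assert a != ScalarResult(0.50003, 3.0)   # same value, but different weight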


class Metric(ABC):
"""Abstract class for defining a metric, which takes a list of annotations
52 changes: 41 additions & 11 deletions nucleus/metrics/cuboid_metrics.py
@@ -1,4 +1,5 @@
import sys
import warnings
from abc import abstractmethod
from typing import List, Optional, Union

@@ -10,6 +11,9 @@
from .filtering import ListOfAndFilters, ListOfOrAndFilters
from .filters import confidence_filter

DEFAULT_IOU_THRESHOLD = 0.1
Contributor:
Why are we changing the default from 0.0 to 0.1? I'm not against it; it would just be nice to have a comment explaining the choice of default.

Contributor Author:
The default of 0.0 is really confusing in my opinion, in particular because it makes predictions with zero overlap true positives. 0.1 seemed reasonable for 3D IoU, though I wouldn't be opposed to 0.5 (to match the 2D default threshold) - what do you think?
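To make the concern concrete (editorial note, not part of the diff): detection_iou keeps a pair when its best IoU satisfies m >= threshold_in_overlap_ratio, so with the old default of 0.0 even a zero-overlap pair passes the check:

best_iou = 0.0                 # prediction has no overlap with any ground truth
assert best_iou >= 0.0         # counted as a match under the old default of 0.0
assert not best_iou >= 0.1     # rejected under the new DEFAULT_IOU_THRESHOLD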

DEFAULT_CONFIDENCE_THRESHOLD = 0.0


class CuboidMetric(Metric):
"""Abstract class for metrics of cuboids.
@@ -28,7 +32,7 @@ class CuboidMetric(Metric):
def __init__(
self,
enforce_label_match: bool = False,
confidence_threshold: float = 0.0,
confidence_threshold: Optional[float] = None,
Contributor:
Doesn't it make sense to also add the IoU threshold to the base class? How would a metric make sense without computing the IoU for the matches?

Contributor Author:
I also noticed that iou_threshold isn't used in the base class; I can add it (see the sketch below for one possible shape).

annotation_filters: Optional[
Union[ListOfOrAndFilters, ListOfAndFilters]
] = None,
@@ -54,6 +58,11 @@ def __init__(
(AND), forming a more selective and multiple column predicate. Finally, the most outer list combines
these filters as a disjunction (OR).
"""
if confidence_threshold is None:
confidence_threshold = DEFAULT_CONFIDENCE_THRESHOLD
warnings.warn(
f"Got confidence_threshold value of `None`. In this case, we set the confidence_threshold to {confidence_threshold} (include all predictions, regardless of confidence). Consider specifying this value explicitly during metric initialization."
)
self.enforce_label_match = enforce_label_match
assert 0 <= confidence_threshold <= 1
self.confidence_threshold = confidence_threshold
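As a hedged sketch of the base-class change discussed above (not part of this diff; names and placement are assumptions), CuboidMetric could accept and validate iou_threshold the same way it now handles confidence_threshold:

class CuboidMetric(Metric):
    def __init__(
        self,
        enforce_label_match: bool = False,
        iou_threshold: Optional[float] = None,
        confidence_threshold: Optional[float] = None,
    ):
        if iou_threshold is None:
            iou_threshold = DEFAULT_IOU_THRESHOLD
            warnings.warn(
                f"iou_threshold was not specified; defaulting to {iou_threshold}."
            )
        assert 0 <= iou_threshold <= 1
        self.iou_threshold = iou_threshold
        # ... confidence_threshold handling as above ...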
@@ -99,8 +108,8 @@ class CuboidIOU(CuboidMetric):
def __init__(
self,
enforce_label_match: bool = True,
iou_threshold: float = 0.0,
confidence_threshold: float = 0.0,
iou_threshold: Optional[float] = None,
confidence_threshold: Optional[float] = None,
iou_2d: bool = False,
annotation_filters: Optional[
Union[ListOfOrAndFilters, ListOfAndFilters]
@@ -127,6 +136,11 @@ def __init__(
interpreted as a conjunction (AND), forming a more selective and multiple column predicate.
Finally, the most outer list combines these filters as a disjunction (OR).
"""
if iou_threshold is None:
iou_threshold = DEFAULT_IOU_THRESHOLD
warnings.warn(
f"The IoU threshold used for matching was initialized to `None`. In this case, the value of iou_threshold defaults to {iou_threshold}. If this value produces unexpected behavior, consider specifying the iou_threshold argument during metric initialization."
)
assert (
0 <= iou_threshold <= 1
), "IoU threshold must be between 0 and 1."
@@ -147,13 +161,15 @@ def eval(
iou_3d_metric, iou_2d_metric = detection_iou(
predictions,
annotations,
threshold_in_overlap_ratio=self.iou_threshold,
self.iou_threshold,
self.enforce_label_match,
)

weight = max(len(annotations), len(predictions))
if self.iou_2d:
weight = len(iou_2d_metric)
avg_iou = iou_2d_metric.sum() / max(weight, sys.float_info.epsilon)
else:
weight = len(iou_3d_metric)
avg_iou = iou_3d_metric.sum() / max(weight, sys.float_info.epsilon)
Contributor:
If the weight is zero by some chance (is that even possible?), won't that make avg_iou absurdly large, since we would be dividing by sys.float_info.epsilon?

Perhaps if weight == 0 then avg_iou should be 0 too?

Not sure what is correct here.

Contributor Author:
Good catch - I agree, the boundary condition is incorrect here; the IoU should be zero when the weight is zero in that case.

I will also add unit test coverage for this case
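One possible shape for that fix (editorial sketch of the agreed follow-up, not the current diff):

if self.iou_2d:
    weight = len(iou_2d_metric)
    iou_sum = iou_2d_metric.sum()
else:
    weight = len(iou_3d_metric)
    iou_sum = iou_3d_metric.sum()
# Report zero IoU when there is nothing to average, instead of dividing
# by sys.float_info.epsilon and producing an absurdly large value.
avg_iou = iou_sum / weight if weight > 0 else 0.0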


return ScalarResult(avg_iou, weight)
@@ -166,8 +182,8 @@ class CuboidPrecision(CuboidMetric):
def __init__(
self,
enforce_label_match: bool = True,
iou_threshold: float = 0.0,
confidence_threshold: float = 0.0,
iou_threshold: Optional[float] = None,
confidence_threshold: Optional[float] = None,
annotation_filters: Optional[
Union[ListOfOrAndFilters, ListOfAndFilters]
] = None,
@@ -192,6 +208,11 @@ def __init__(
interpreted as a conjunction (AND), forming a more selective and multiple column predicate.
Finally, the most outer list combines these filters as a disjunction (OR).
"""
if iou_threshold is None:
iou_threshold = DEFAULT_IOU_THRESHOLD
warnings.warn(
f"The IoU threshold used for matching was initialized to `None`. In this case, the value of iou_threshold defaults to {iou_threshold}. If this value produces unexpected behavior, consider specifying the iou_threshold argument during metric initialization."
)
assert (
0 <= iou_threshold <= 1
), "IoU threshold must be between 0 and 1."
@@ -211,7 +232,9 @@ def eval(
stats = recall_precision(
predictions,
annotations,
threshold_in_overlap_ratio=self.iou_threshold,
self.iou_threshold,
self.confidence_threshold,
self.enforce_label_match,
)
weight = stats["tp_sum"] + stats["fp_sum"]
precision = stats["tp_sum"] / max(weight, sys.float_info.epsilon)
@@ -225,8 +248,8 @@ class CuboidRecall(CuboidMetric):
def __init__(
self,
enforce_label_match: bool = True,
iou_threshold: float = 0.0,
confidence_threshold: float = 0.0,
iou_threshold: Optional[float] = None,
confidence_threshold: Optional[float] = None,
Contributor, on lines +254 to +255:
Changes to default params need to be reflected in the nucleus/validate/eval_functions/available_eval_functions.py configurations as well, since that is the client-facing code. The defaults there override the defaults provided here if they are not kept in sync.

annotation_filters: Optional[
Union[ListOfOrAndFilters, ListOfAndFilters]
] = None,
@@ -241,6 +264,11 @@ def __init__(
iou_threshold: IOU threshold to consider detection as valid. Must be in [0, 1]. Default 0.0
confidence_threshold: minimum confidence threshold for predictions. Must be in [0, 1]. Default 0.0
"""
if iou_threshold is None:
iou_threshold = DEFAULT_IOU_THRESHOLD
warnings.warn(
f"The IoU threshold used for matching was initialized to `None`. In this case, the value of iou_threshold defaults to {iou_threshold}. If this value produces unexpected behavior, consider specifying the iou_threshold argument during metric initialization."
)
assert (
0 <= iou_threshold <= 1
), "IoU threshold must be between 0 and 1."
@@ -260,7 +288,9 @@ def eval(
stats = recall_precision(
predictions,
annotations,
threshold_in_overlap_ratio=self.iou_threshold,
self.iou_threshold,
self.confidence_threshold,
self.enforce_label_match,
)
weight = stats["tp_sum"] + stats["fn_sum"]
recall = stats["tp_sum"] / max(weight, sys.float_info.epsilon)
31 changes: 25 additions & 6 deletions nucleus/metrics/cuboid_utils.py
@@ -101,18 +101,25 @@ def wrapper(
return wrapper


def process_dataitem(dataitem):
def process_dataitem(item_list, confidence_threshold=None):
Contributor:
This is a pretty generic name that could be more concrete. If you have the context, it would be nice to rename it or add a docstring explaining what this "processing" is doing.

Contributor Author:
I don't really have much context, but I agree with you that this is a terrible name... I will try to come up with something better.

if confidence_threshold:
item_list = [
item
for item in item_list
if item.confidence >= confidence_threshold
]
processed_item = {}
processed_item["xyz"] = np.array(
[[ann.position.x, ann.position.y, ann.position.z] for ann in dataitem]
[[ann.position.x, ann.position.y, ann.position.z] for ann in item_list]
Contributor:
Why do we actually have a dict here for the processed item? Wouldn't a dataclass or namedtuple be better? I'm not a huge fan of dicts interface-wise (a sketch follows this function below).

)
processed_item["wlh"] = np.array(
[
[ann.dimensions.x, ann.dimensions.y, ann.dimensions.z]
for ann in dataitem
for ann in item_list
]
)
processed_item["yaw"] = np.array([ann.yaw for ann in dataitem])
processed_item["yaw"] = np.array([ann.yaw for ann in item_list])
processed_item["labels"] = [ann.label for ann in item_list]
return processed_item
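A hedged sketch of the reviewer's dataclass suggestion (hypothetical, not part of this diff; field names mirror the dict keys above):

from dataclasses import dataclass
from typing import List

import numpy as np

@dataclass
class ProcessedCuboids:
    xyz: np.ndarray    # (N, 3) center positions
    wlh: np.ndarray    # (N, 3) box dimensions
    yaw: np.ndarray    # (N,) headings
    labels: List[str]  # per-cuboid labels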


@@ -278,6 +285,8 @@ def recall_precision(
prediction: List[CuboidPrediction],
groundtruth: List[CuboidAnnotation],
threshold_in_overlap_ratio: float,
confidence_threshold: float,
enforce_label_match: bool,
) -> Dict[str, float]:
"""
Calculates the precision and recall of each lidar frame.
Expand All @@ -295,7 +304,7 @@ def recall_precision(
num_instances = 0

gt_items = process_dataitem(groundtruth)
pred_items = process_dataitem(prediction)
pred_items = process_dataitem(prediction, confidence_threshold)

num_predicted += pred_items["xyz"].shape[0]
num_instances += gt_items["xyz"].shape[0]
@@ -317,6 +326,10 @@
for pred_id, gt_id in mapping:
if fn[gt_id] == 0:
continue
if enforce_label_match and not (
gt_items["labels"][gt_id] == pred_items["labels"][pred_id]
):
continue
tp[pred_id] = 1
fp[pred_id] = 0
fn[gt_id] = 0
@@ -340,6 +353,7 @@ def detection_iou(
prediction: List[CuboidPrediction],
groundtruth: List[CuboidAnnotation],
threshold_in_overlap_ratio: float,
enforce_label_match: bool,
) -> Tuple[np.ndarray, np.ndarray]:
"""
Calculates the 2D IOU and 3D IOU overlap between predictions and groundtruth.
@@ -370,8 +384,13 @@
)

for i, m in enumerate(iou_3d.max(axis=1)):
j = iou_3d[i].argmax()
if (
enforce_label_match
and gt_items["labels"][i] != pred_items["labels"][j]
):
continue
if m >= threshold_in_overlap_ratio:
j = iou_3d[i].argmax()
meter_3d.append(iou_3d[i, j])
meter_2d.append(iou_2d[i, j])
