-from labelbox.data.metrics.iou.calculation import _get_mask_pairs, _get_vector_pairs, miou
-
-from labelbox.data.annotation_types.metrics.confusion_matrix import \
-    ConfusionMatrixMetricValue
-
-from labelbox.data.annotation_types.metrics.scalar import ScalarMetricValue
 from typing import List, Optional, Tuple, Union
+
 import numpy as np
+
+from ..iou.calculation import _get_mask_pairs, _get_vector_pairs, miou
 from ...annotation_types import (ObjectAnnotation, ClassificationAnnotation,
-                                 Mask, Geometry, Checklist, Radio)
-from ..processing import get_feature_pairs, get_identifying_key, has_no_annotations, has_no_matching_annotations
+                                 Mask, Geometry, Checklist, Radio,
+                                 ScalarMetricValue, ConfusionMatrixMetricValue)
+from ..processing import (get_feature_pairs, get_identifying_key,
+                          has_no_annotations, has_no_matching_annotations)
 
 
 def confusion_matrix(ground_truths: List[Union[ObjectAnnotation,
@@ -17,34 +16,58 @@ def confusion_matrix(ground_truths: List[Union[ObjectAnnotation,
                                                ClassificationAnnotation]],
                      include_subclasses: bool,
                      iou: float) -> ConfusionMatrixMetricValue:
+ """
20
+ Computes the confusion matrix for an arbitrary set of ground truth and predicted annotations.
21
+ It first computes the confusion matrix for each metric and then sums across all classes
22
+
23
+ Args:
24
+ ground_truth : Label containing human annotations or annotations known to be correct
25
+ prediction: Label representing model predictions
26
+ include_subclasses (bool): Whether or not to include subclasses in the calculation.
27
+ If set to True, the iou between two overlapping objects of the same type is 0 if the subclasses are not the same.
28
+ iou: minimum overlap between objects for them to count as matching
29
+ Returns:
30
+ confusion matrix as a list: [TP,FP,TN,FN]
31
+ Returns None if there are no annotations in ground_truth or prediction annotations
32
+ """
 
     annotation_pairs = get_feature_pairs(predictions, ground_truths)
-    ious = [
+    conf_matrix = [
         feature_confusion_matrix(annotation_pair[0], annotation_pair[1],
                                  include_subclasses, iou)
         for annotation_pair in annotation_pairs.values()
     ]
-    ious = [iou for iou in ious if iou is not None]
-
-    return None if not len(ious) else np.sum(ious, axis=0).tolist()
+    matrices = [matrix for matrix in conf_matrix if matrix is not None]
+    return None if not len(matrices) else np.sum(matrices, axis=0).tolist()
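A minimal sketch of the aggregation this hunk introduces: each feature class yields a `[TP, FP, TN, FN]` list (or `None` when the class has no annotations on either side), and `np.sum(..., axis=0)` adds them element-wise. The class names and counts below are made up for illustration:

```python
import numpy as np

# Hypothetical per-class confusion matrices: [TP, FP, TN, FN]
conf_matrix = [
    [3, 1, 0, 2],  # e.g. "car"
    [5, 0, 0, 1],  # e.g. "person"
    None,          # a class with no annotations is skipped
]
matrices = [matrix for matrix in conf_matrix if matrix is not None]
# Element-wise sum across classes, as in the new return statement
print(None if not len(matrices) else np.sum(matrices, axis=0).tolist())
# -> [8, 1, 0, 3]
```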
 
 
 def feature_confusion_matrix(
         ground_truths: List[Union[ObjectAnnotation, ClassificationAnnotation]],
         predictions: List[Union[ObjectAnnotation, ClassificationAnnotation]],
         include_subclasses: bool,
         iou: float) -> Optional[ConfusionMatrixMetricValue]:
+    """
+    Computes the confusion matrix for all features of the same class.
+
+    Args:
+        ground_truths: List of ground truth annotations belonging to the same class.
+        predictions: List of predicted annotations belonging to the same class.
+        include_subclasses (bool): Whether or not to include subclasses in the calculation.
+            If set to True, the iou between two overlapping objects of the same type is 0 if the subclasses are not the same.
+        iou: Minimum overlap between objects for them to count as matching
+    Returns:
+        confusion matrix as a list: [TP, FP, TN, FN]
+        Returns None if there are no ground truth or prediction annotations
+    """
     if has_no_matching_annotations(ground_truths, predictions):
         return [0, int(len(predictions) > 0), 0, int(len(ground_truths) > 0)]
     elif has_no_annotations(ground_truths, predictions):
-        # Note that we could return [0,0,0,0] but that will bloat the imports for no reason
         return None
     elif isinstance(predictions[0].value, Mask):
-        return mask_confusion_matrix(ground_truths, predictions, iou,
-                                     include_subclasses)
+        return mask_confusion_matrix(ground_truths, predictions,
+                                     include_subclasses, iou)
     elif isinstance(predictions[0].value, Geometry):
-        return vector_confusion_matrix(ground_truths, predictions, iou,
-                                       include_subclasses)
+        return vector_confusion_matrix(ground_truths, predictions,
+                                       include_subclasses, iou)
     elif isinstance(predictions[0], ClassificationAnnotation):
         return classification_confusion_matrix(ground_truths, predictions)
     else:
@@ -63,7 +86,8 @@ def classification_confusion_matrix(
         ground_truths: List of ground truth classification annotations
         predictions: List of prediction classification annotations
     Returns:
-        float representing the iou score for the classification
+        confusion matrix as a list: [TP, FP, TN, FN]
+        Returns None if there are no ground truth or prediction annotations
     """
 
     if has_no_matching_annotations(ground_truths, predictions):
@@ -86,27 +110,56 @@ def classification_confusion_matrix(
     elif isinstance(prediction.value, Checklist):
         return checklist_confusion_matrix(ground_truth.value, prediction.value)
     else:
-        raise ValueError(f"Unsupported subclass. {prediction}.")
+        raise ValueError(
+            f"Unsupported subclass. {prediction}. Only Radio and Checklist are supported"
+        )
 
 
 def vector_confusion_matrix(ground_truths: List[ObjectAnnotation],
                             predictions: List[ObjectAnnotation],
-                            iou: float,
                             include_subclasses: bool,
+                            iou: float,
                             buffer=70.) -> Optional[ConfusionMatrixMetricValue]:
+    """
+    Computes the confusion matrix for any vector class (point, polygon, line, rectangle).
+    Ground truths and predictions should all belong to the same class.
+
+    Args:
+        ground_truths: List of ground truth vector annotations
+        predictions: List of prediction vector annotations
+        include_subclasses (bool): Whether or not to include subclasses in the calculation.
+            If set to True, the iou between two overlapping objects of the same type is 0 if the subclasses are not the same.
+        iou: Minimum overlap between objects for them to count as matching
+        buffer: How much to buffer points and lines (used for determining if the overlap meets the iou threshold)
+    Returns:
+        confusion matrix as a list: [TP, FP, TN, FN]
+        Returns None if there are no ground truth or prediction annotations
+    """
     if has_no_matching_annotations(ground_truths, predictions):
         return [0, int(len(predictions) > 0), 0, int(len(ground_truths) > 0)]
     elif has_no_annotations(ground_truths, predictions):
         return None
 
     pairs = _get_vector_pairs(ground_truths, predictions, buffer=buffer)
-    return object_pair_confusion_matrix(pairs, iou, include_subclasses)
+    return object_pair_confusion_matrix(pairs, include_subclasses, iou)
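A note on `buffer`: points and lines have zero area, so a plain IoU would always be 0 for them. A rough illustration of why buffering makes the threshold meaningful, using shapely directly; this only sketches the idea, and whether `_get_vector_pairs` buffers exactly this way is not shown in this hunk:

```python
from shapely.geometry import LineString

# Two nearby lines have zero area, so an unbuffered IoU would always be 0.
pred = LineString([(0, 0), (100, 0)])
label = LineString([(0, 5), (100, 5)])

# Buffering by ~70px (the default above) gives each line an area,
# so an IoU-style overlap check becomes meaningful.
pred_poly = pred.buffer(70.)
label_poly = label.buffer(70.)
iou = pred_poly.intersection(label_poly).area / pred_poly.union(label_poly).area
print(round(iou, 3))  # close to 1 -> would count as a match at typical thresholds
```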
 
 
-def object_pair_confusion_matrix(
-        pairs: List[Tuple[ObjectAnnotation, ObjectAnnotation,
-                          ScalarMetricValue]], iou,
-        include_subclasses) -> ConfusionMatrixMetricValue:
+def object_pair_confusion_matrix(pairs: List[Tuple[ObjectAnnotation,
+                                                   ObjectAnnotation,
+                                                   ScalarMetricValue]],
+                                 include_subclasses: bool,
+                                 iou: float) -> ConfusionMatrixMetricValue:
+    """
+    Computes the confusion matrix for a list of object annotation pairs.
+    Performs greedy matching of the pairs.
+
+    Args:
+        pairs: A list of object annotation pairs with an iou score.
+            This is used to determine matching priority (and whether objects match at all) since objects can only be matched once.
+        include_subclasses (bool): Whether or not to include subclasses in the calculation.
+        iou: iou threshold to determine if objects are matching
+    Returns:
+        confusion matrix as a list: [TP, FP, TN, FN]
+    """
     pairs.sort(key=lambda triplet: triplet[2], reverse=True)
     prediction_ids = set()
     ground_truth_ids = set()
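The hunk cuts off mid-function here, so as a reading aid, a stripped-down sketch of the greedy matching the docstring describes. This is not the exact implementation; `id()` stands in for however the real code tracks already-matched annotations:

```python
def greedy_confusion_matrix(pairs, iou_threshold):
    """pairs: (ground_truth, prediction, iou_score) triplets."""
    pairs = sorted(pairs, key=lambda triplet: triplet[2], reverse=True)
    matched_gt, matched_pred = set(), set()
    tps = 0
    for gt, pred, score in pairs:
        if score < iou_threshold:
            continue  # overlap too small to count as a match
        if id(gt) in matched_gt or id(pred) in matched_pred:
            continue  # each annotation can only be matched once
        matched_gt.add(id(gt))
        matched_pred.add(id(pred))
        tps += 1
    # Unmatched predictions are FPs, unmatched labels are FNs, TNs untracked.
    fps = len({id(p) for _, p, _ in pairs} - matched_pred)
    fns = len({id(g) for g, _, _ in pairs} - matched_gt)
    return [tps, fps, 0, fns]

# Toy pairs; strings stand in for annotation objects.
pairs = [("gt_a", "pred_1", 0.9), ("gt_a", "pred_2", 0.6), ("gt_b", "pred_2", 0.3)]
print(greedy_confusion_matrix(pairs, iou_threshold=0.5))  # [1, 1, 0, 1]
```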
@@ -144,11 +197,10 @@ def radio_confusion_matrix(ground_truth: Radio,
     """
     Calculates confusion between ground truth and predicted radio values
 
-    The way we are calculating confusion matrix metrics:
-        - TNs aren't defined because we don't know how many other classes exist ... etc
-
-    When P == L, then we get [1,0,0,0]
-    when P != L, we get [0,1,0,1]
+    Calculation:
+        - TNs aren't defined because we don't know how many other classes exist
+        - When P == L, then we get [1,0,0,0]
+        - When P != L, we get [0,1,0,1]
 
     This is because we are aggregating the stats for the entire radio. Not for each class.
     Since we are not tracking TNs (P == L) only adds to TP.
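The rule stated above is easy to check by hand. A hedged sketch with plain strings standing in for Radio answers:

```python
def radio_confusion_sketch(label_answer: str, prediction_answer: str):
    # P == L: one true positive, nothing else moves.
    if prediction_answer == label_answer:
        return [1, 0, 0, 0]
    # P != L: the wrong prediction is a FP and the missed label a FN.
    return [0, 1, 0, 1]

print(radio_confusion_sketch("cat", "cat"))  # [1, 0, 0, 0]
print(radio_confusion_sketch("cat", "dog"))  # [0, 1, 0, 1]
```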
@@ -169,9 +221,16 @@ def checklist_confusion_matrix(
         ground_truth: Checklist,
         prediction: Checklist) -> ConfusionMatrixMetricValue:
     """
-    Calculates agreement between ground truth and predicted checklist items
+    Calculates agreement between ground truth and predicted checklist items:
+
+    Calculation:
+        - When a prediction matches a label, that counts as a true positive.
+        - When a prediction was made that has no corresponding label, this is counted as a false positive.
+        - When a label has no corresponding prediction, this is counted as a false negative.
+
+    We are also not tracking TNs since we don't know the number of possible classes
+    (and they aren't necessary for precision/recall/f1).
 
-    Also not tracking TNs
     """
     key = get_identifying_key(prediction.answer, ground_truth.answer)
     schema_ids_pred = {getattr(answer, key) for answer in prediction.answer}
@@ -185,33 +244,35 @@ def checklist_confusion_matrix(
     return [tps, fps, 0, fns]
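The set arithmetic behind that return value is easy to sanity-check. A toy version with plain strings in place of answer schema ids (`get_identifying_key` and the answer objects are elided):

```python
labels = {"has_helmet", "has_vest"}
preds = {"has_helmet", "has_gloves"}

tps = len(labels & preds)  # answers present on both sides
fps = len(preds - labels)  # predicted but not labeled
fns = len(labels - preds)  # labeled but not predicted
print([tps, fps, 0, fns])  # [1, 1, 0, 1] -- TNs are not tracked
```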
 
 
-def mask_confusion_matrix(
-        ground_truths: List[ObjectAnnotation],
-        predictions: List[ObjectAnnotation], iou,
-        include_subclasses: bool) -> Optional[ScalarMetricValue]:
+def mask_confusion_matrix(ground_truths: List[ObjectAnnotation],
+                          predictions: List[ObjectAnnotation],
+                          include_subclasses: bool,
+                          iou: float) -> Optional[ScalarMetricValue]:
     """
-    Computes iou score for all features with the same feature schema id.
-    Calculation includes subclassifications.
+    Computes the confusion matrix metric for masks.
+
+    Important:
+        - If including subclasses in the calculation, then the metrics are computed the same as if it were object detection;
+          each mask is its own instance.
+        - Otherwise this metric is computed on pixel-level annotations.
 
     Args:
         ground_truths: List of ground truth mask annotations
         predictions: List of prediction mask annotations
     Returns:
-        float representing the iou score for the masks
+        confusion matrix as a list: [TP, FP, TN, FN]
+        Returns None if there are no ground truth or prediction annotations
     """
     if has_no_matching_annotations(ground_truths, predictions):
         return [0, int(len(predictions) > 0), 0, int(len(ground_truths) > 0)]
     elif has_no_annotations(ground_truths, predictions):
         return None
 
     if include_subclasses:
-        # This results in a faily drastically different value.
+        # This results in a fairly drastically different value than without subclasses.
         # If we have subclasses set to True, then this is object detection with masks
-        # Otherwise this will flatten the masks.
-        # TODO: Make this more apprent in the configuration.
+        # Otherwise this will compute metrics on each pixel.
         pairs = _get_mask_pairs(ground_truths, predictions)
         return object_pair_confusion_matrix(
-            pairs, iou, include_subclasses=include_subclasses)
+            pairs, include_subclasses=include_subclasses, iou=iou)
 
     prediction_np = np.max([pred.value.draw(color=1) for pred in predictions],
                            axis=0)
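When `include_subclasses` is False, the masks are rasterized and compared per pixel; `np.max` over the drawn masks collapses overlapping instances into one binary array, as in the lines above. A small sketch of pixel-level counting with plain numpy arrays (whether the real implementation tallies TNs exactly this way is not shown in this hunk):

```python
import numpy as np

# Tiny binary masks standing in for pred.value.draw(color=1) output.
prediction_np = np.array([[1, 1, 0],
                          [0, 1, 0],
                          [0, 0, 0]], dtype=bool)
ground_truth_np = np.array([[1, 0, 0],
                            [0, 1, 1],
                            [0, 0, 0]], dtype=bool)

tps = int(np.sum(prediction_np & ground_truth_np))    # pixel set in both
fps = int(np.sum(prediction_np & ~ground_truth_np))   # predicted only
fns = int(np.sum(~prediction_np & ground_truth_np))   # labeled only
tns = int(np.sum(~prediction_np & ~ground_truth_np))  # background in both
print([tps, fps, tns, fns])  # [2, 1, 5, 1]
```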