add support for media types in label exports

Matt Sokoloff · Matt Sokoloff · commit a3fa5af3ac0b · 2021-11-17T09:13:25.000-05:00
diff --git a/labelbox/data/serialization/labelbox_v1/classification.py b/labelbox/data/serialization/labelbox_v1/classification.py
@@ -9,24 +9,25 @@
 
 
 class LBV1ClassificationAnswer(LBV1Feature):
+
     def to_common(self) -> ClassificationAnswer:
         return ClassificationAnswer(feature_schema_id=self.schema_id,
-                  name=self.title,
-                  keyframe = self.keyframe,
-                  extra={
-                      'feature_id': self.feature_id,
-                      'value': self.value
-                  })
+                                    name=self.title,
+                                    keyframe=self.keyframe,
+                                    extra={
+                                        'feature_id': self.feature_id,
+                                        'value': self.value
+                                    })
 
     @classmethod
-    def from_common(cls, answer: ClassificationAnnotation) -> "LBV1ClassificationAnswer":
-        return cls(
-        schema_id=answer.feature_schema_id,
-        title=answer.name,
-        value=answer.extra.get('value'),
-        feature_id=answer.extra.get('feature_id'),
-        keyframe=answer.keyframe
-    )
+    def from_common(
+            cls,
+            answer: ClassificationAnnotation) -> "LBV1ClassificationAnswer":
+        return cls(schema_id=answer.feature_schema_id,
+                   title=answer.name,
+                   value=answer.extra.get('value'),
+                   feature_id=answer.extra.get('feature_id'),
+                   keyframe=answer.keyframe)
 
 
 class LBV1Radio(LBV1Feature):
@@ -47,9 +48,7 @@ class LBV1Checklist(LBV1Feature):
     answers: List[LBV1ClassificationAnswer]
 
     def to_common(self) -> Checklist:
-        return Checklist(answer=[
-            answer.to_common() for answer in self.answers
-        ])
+        return Checklist(answer=[answer.to_common() for answer in self.answers])
 
     @classmethod
     def from_common(cls, checklist: Checklist, feature_schema_id: Cuid,
@@ -66,9 +65,7 @@ class LBV1Dropdown(LBV1Feature):
     answer: List[LBV1ClassificationAnswer]
 
     def to_common(self) -> Dropdown:
-        return Dropdown(answer=[
-            answer.to_common() for answer in self.answer
-        ])
+        return Dropdown(answer=[answer.to_common() for answer in self.answer])
 
     @classmethod
     def from_common(cls, dropdown: Dropdown, feature_schema_id: Cuid,
diff --git a/labelbox/data/serialization/labelbox_v1/label.py b/labelbox/data/serialization/labelbox_v1/label.py
@@ -137,20 +137,17 @@ class LBV1Label(BaseModel):
     label_url: Optional[str] = Extra('View Label')
     has_open_issues: Optional[float] = Extra('Has Open Issues')
     skipped: Optional[bool] = Extra('Skipped')
+    media_type: Optional[str] = Extra('media_type')
 
     def to_common(self) -> Label:
         if isinstance(self.label, list):
             annotations = []
             for lbl in self.label:
                 annotations.extend(lbl.to_common())
-            data = VideoData(url=self.row_data,
-                             external_id=self.external_id,
-                             uid=self.data_row_id)
         else:
             annotations = self.label.to_common()
-            data = self._infer_media_type()
 
-        return Label(data=data,
+        return Label(data=self._data_row_to_common(),
                      uid=self.id,
                      annotations=annotations,
                      extra={
@@ -174,44 +171,49 @@ def from_common(cls, label: Label):
                          external_id=label.data.external_id,
                          **label.extra)
 
-    def _infer_media_type(self):
-        # Video annotations are formatted differently from text and images
-        # So we only need to differentiate those two
+    def _data_row_to_common(self) -> Union[ImageData, TextData, VideoData]:
+        # Use data row information to construct the appropriate annotation type
         data_row_info = {
+            'url' if self._is_url() else 'text': self.row_data,
             'external_id': self.external_id,
             'uid': self.data_row_id
         }
 
+        self.media_type = self.media_type or self._infer_media_type()
+        media_mapping = {
+            'text': TextData,
+            'image': ImageData,
+            'video': VideoData
+        }
+        if self.media_type not in media_mapping:
+            raise ValueError(
+                f"Annotation types are only supported for {list(media_mapping)} media types."
+                f" Found {self.media_type}.")
+        return media_mapping[self.media_type](**data_row_info)
+
+    def _infer_media_type(self) -> str:
+        # Determines the data row type based on the label content
+        if isinstance(self.label, list):
+            return 'video'
         if self._has_text_annotations():
-            # If it has text annotations then it must be text
-            if self._is_url():
-                return TextData(url=self.row_data, **data_row_info)
-            else:
-                return TextData(text=self.row_data, **data_row_info)
+            return 'text'
         elif self._has_object_annotations():
-            # If it has object annotations and none are text annotations then it must be an image
-            if self._is_url():
-                return ImageData(url=self.row_data, **data_row_info)
-            else:
-                return ImageData(text=self.row_data, **data_row_info)
+            return 'image'
         else:
-            # no annotations to infer data type from.
-            # Use information from the row_data format if possible.
             if self._row_contains((".jpg", ".png", ".jpeg")) and self._is_url():
-                return ImageData(url=self.row_data, **data_row_info)
-            elif self._row_contains(
-                (".txt", ".text", ".html")) and self._is_url():
-                return TextData(url=self.row_data, **data_row_info)
-            elif not self._is_url():
-                return TextData(text=self.row_data, **data_row_info)
+                return 'image'
+            elif (self._row_contains((".txt", ".text", ".html")) and
+                  self._is_url()) or not self._is_url():
+                return 'text'
             else:
-                # This is going to be urls that do not contain any file extensions
-                # This will only occur on skipped images.
-                # To use this converter on data with this url format
-                #   filter out empty examples from the payload before deserializing.
+                #  This condition will occur when a data row url does not contain a file extension
+                #  and the label does not contain object annotations that indicate the media type.
+                #  As a temporary workaround you can explicitly set the media_type
+                #  in each label json payload before converting.
+                #  We will eventually provide the media type in the export.
                 raise TypeError(
-                    "Can't infer data type from row data. Remove empty examples before trying again. "
-                    f"row_data: {self.row_data[:200]}")
+                    f"Can't infer data type from row data. row_data: {self.row_data[:200]}"
+                )
 
     def _has_object_annotations(self):
         return len(self.label.objects) > 0
diff --git a/tests/data/serialization/labelbox_v1/test_image.py b/tests/data/serialization/labelbox_v1/test_image.py
@@ -16,7 +16,11 @@ def test_image(file_path):
     collection = LBV1Converter.deserialize([payload])
     serialized = next(LBV1Converter.serialize(collection))
 
+    # We are storing the media types now.
+    payload['media_type'] = 'image'
+
     assert serialized.keys() == payload.keys()
+
     for key in serialized:
         if key != 'Label':
             assert serialized[key] == payload[key]
diff --git a/tests/data/serialization/labelbox_v1/test_text.py b/tests/data/serialization/labelbox_v1/test_text.py
@@ -9,6 +9,8 @@ def test_text():
     collection = LBV1Converter.deserialize([payload])
     serialized = next(LBV1Converter.serialize(collection))
 
+    payload['media_type'] = 'text'
+
     assert serialized.keys() == payload.keys()
     for key in serialized:
         if key != 'Label':
diff --git a/tests/data/serialization/labelbox_v1/test_video.py b/tests/data/serialization/labelbox_v1/test_video.py
@@ -17,7 +17,7 @@ def test_video():
         open('tests/data/assets/labelbox_v1/video_export.json', 'r'))
     collection = LBV1Converter.deserialize([payload])
     serialized = next(LBV1Converter.serialize(collection))
-
+    payload['media_type'] = 'video'
     assert serialized.keys() == payload.keys()
     for key in serialized:
         if key != 'Label':