review + tests

jihan-yin · jihan-yin · commit e8a5098ead08 · 2021-09-16T13:46:36.000-07:00
diff --git a/nucleus/constants.py b/nucleus/constants.py
@@ -63,8 +63,7 @@
 MODEL_RUN_ID_KEY = "model_run_id"
 NAME_KEY = "name"
 NEW_ITEMS = "new_items"
-NUCLEUS_ENDPOINT = "https://jihan-yin-api.devbox.internal.scale.com/v1/nucleus"
-# NUCLEUS_ENDPOINT = "https://api.scale.com/v1/nucleus"
+NUCLEUS_ENDPOINT = "https://api.scale.com/v1/nucleus"
 NUM_SENSORS_KEY = "num_sensors"
 ORIGINAL_IMAGE_URL_KEY = "original_image_url"
 POINTCLOUD_KEY = "pointcloud"
diff --git a/nucleus/dataset.py b/nucleus/dataset.py
@@ -92,8 +92,18 @@ def autotag_items(self, autotag_name, for_scores_greater_than=0):
 
         :return: dictionary of the form
             {
-                'autotagItems': AutotagItem[],
-                'autotag': Autotag
+                'autotagItems': {
+                    ref_id: str,
+                    score: float,
+                    model_prediction_id: str | None,
+                    ground_truth_annotation_id: str | None,
+                }[],
+                'autotag': {
+                    id: str,
+                    name: str,
+                    status: 'started' | 'completed',
+                    autotag_level: 'Image' | 'Object'
+                }
             }
         See https://dashboard.nucleus.scale.com/nucleus/docs/api#export-autotag-items for more details on the return types.
         """
@@ -109,8 +119,17 @@ def autotag_training_items(self, autotag_name):
 
         :return: dictionary of the form
             {
-                'autotagTrainingItems': AutotagTrainingItem[],
-                'autotag': Autotag
+                'autotagPositiveTrainingItems': {
+                    ref_id: str,
+                    model_prediction_id: str | None,
+                    ground_truth_annotation_id: str | None,
+                }[],
+                'autotag': {
+                    id: str,
+                    name: str,
+                    status: 'started' | 'completed',
+                    autotag_level: 'Image' | 'Object'
+                }
             }
         See https://dashboard.nucleus.scale.com/nucleus/docs/api#export-autotag-training-items for more details on the return types.
         """
diff --git a/tests/test_dataset.py b/tests/test_dataset.py
@@ -329,7 +329,7 @@ def test_raises_error_for_duplicate():
     )
 
 
-def test_dataset_export_autotag_scores(CLIENT):
+def test_dataset_export_autotag_tagged_items(CLIENT):
     # This test can only run for the test user who has an indexed dataset.
     # TODO: if/when we can create autotags via api, create one instead.
     if NUCLEUS_PYTEST_USER_ID in CLIENT.api_key:
@@ -342,11 +342,51 @@ def test_dataset_export_autotag_scores(CLIENT):
             in str(api_error.value)
         )
 
-        scores = dataset.autotag_scores(autotag_name="PytestTestTag")
+        items = dataset.autotag_items(autotag_name="PytestTestTag")
 
-        for column in ["dataset_item_ids", "ref_ids", "scores"]:
-            assert column in scores
-            assert len(scores[column]) > 0
+        assert "autotagItems" in items
+        assert "autotag" in items
+
+        autotagItems = items["autotagItems"]
+        autotag = items["autotag"]
+
+        assert len(autotagItems) > 0
+        for item in autotagItems:
+            for column in ["ref_id", "score"]:
+                assert column in item
+
+        for column in ["id", "name", "status", "autotag_level"]:
+            assert column in autotag
+
+
+def test_dataset_export_autotag_training_items(CLIENT):
+    """Verify autotag_training_items errors and its response shape."""
+    # This test can only run for the test user who has an indexed dataset.
+    # TODO: if/when we can create autotags via api, create one instead.
+    if NUCLEUS_PYTEST_USER_ID in CLIENT.api_key:
+        dataset = CLIENT.get_dataset(DATASET_WITH_AUTOTAG)
+
+        # Exercise the endpoint under test, not a different export call.
+        with pytest.raises(NucleusAPIError) as api_error:
+            dataset.autotag_training_items(autotag_name="NONSENSE_GARBAGE")
+        assert (
+            f"The autotag NONSENSE_GARBAGE was not found in dataset {DATASET_WITH_AUTOTAG}"
+            in str(api_error.value)
+        )
+
+        items = dataset.autotag_training_items(autotag_name="PytestTestTag")
+
+        assert "autotagPositiveTrainingItems" in items
+        assert "autotag" in items
+
+        training_items = items["autotagPositiveTrainingItems"]
+        autotag = items["autotag"]
+
+        assert len(training_items) > 0
+        for item in training_items:
+            assert "ref_id" in item
+        for column in ["id", "name", "status", "autotag_level"]:
+            assert column in autotag
 
 
 @pytest.mark.integration