Clean up some missing stuff and docstrings

Ubuntu · Ubuntu · commit 3ccf31ea05b9 · 2021-09-14T21:55:09.000Z
diff --git a/nucleus/__init__.py b/nucleus/__init__.py
@@ -1,54 +1,7 @@
 """
 Nucleus Python Library.
 
-Data formats used:
-
-_____________________________________________________________________________________________________
-
-DatasetItem
-
-image_url       |   str     |   The URL containing the image for the given row of data.\n
-reference_id    |   str     |   An optional user-specified identifier to reference this given image.\n
-metadata        |   dict    |   All of column definitions for this item.
-                |           |   The keys should match the user-specified column names,
-                |           |   and the corresponding values will populate the cell under the column.\n
-_____________________________________________________________________________________________________
-
-
-Box2DGeometry:
-
-x               |   float   |   The distance, in pixels, between the left border of the bounding box
-                |           |   and the left border of the image.\n
-y               |   float   |   The distance, in pixels, between the top border of the bounding box
-                |           |   and the top border of the image.\n
-width	        |   float   |   The width in pixels of the annotation.\n
-height	        |   float   |   The height in pixels of the annotation.\n
-
-Box2DAnnotation:
-
-item_id         |   str     |   The internally-controlled item identifier to associate this annotation with.
-                |           |   The reference_id field should be empty if this field is populated.\n
-reference_id    |   str     |   The user-specified reference identifier to associate this annotation with.\n
-                |           |   The item_id field should be empty if this field is populated.
-label	        |   str     |	The label for this annotation (e.g. car, pedestrian, bicycle).\n
-type	        |   str     |   The type of this annotation. It should always be the box string literal.\n
-geometry        |   dict    |   Representation of the bounding box in the Box2DGeometry format.\n
-metadata        |   dict    |   An arbitrary metadata blob for the annotation.\n
-
-_____________________________________________________________________________________________________
-
-Box2DDetection:
-
-item_id         |   str     |   The internally-controlled item identifier to associate this annotation with.
-                |           |   The reference_id field should be empty if this field is populated.\n
-reference_id    |   str     |   The user-specified reference identifier to associate this annotation with.
-                |           |   The item_id field should be empty if this field is populated.\n
-label	        |   str     |	The label for this annotation (e.g. car, pedestrian, bicycle).\n
-type	        |   str     |   The type of this annotation. It should always be the box string literal.\n
-confidence      |   float   |   The optional confidence level of this annotation.
-                |           |   It should be between 0 and 1 (inclusive).\n
-geometry        |   dict    |   Representation of the bounding box in the Box2DGeometry format.\n
-metadata        |   dict    |   An arbitrary metadata blob for the annotation.\n
+For full documentation see: https://dashboard.scale.com/nucleus/docs/api?language=python
 """
 import asyncio
 import json
@@ -244,11 +197,8 @@ def get_dataset_items(self, dataset_id) -> List[DatasetItem]:
             for item in dataset_items:
                 image_url = item.get("original_image_url")
                 metadata = item.get("metadata", None)
-                item_id = item.get("id", None)
                 ref_id = item.get("ref_id", None)
-                dataset_item = DatasetItem(
-                    image_url, ref_id, item_id, metadata
-                )
+                dataset_item = DatasetItem(image_url, ref_id, metadata)
                 constructed_dataset_items.append(dataset_item)
         elif error:
             raise DatasetItemRetrievalError(message=error)
@@ -349,26 +299,19 @@ def delete_dataset(self, dataset_id: str) -> dict:
         return self.make_request({}, f"dataset/{dataset_id}", requests.delete)
 
     @sanitize_string_args
-    def delete_dataset_item(
-        self, dataset_id: str, item_id: str = None, reference_id: str = None
-    ) -> dict:
+    def delete_dataset_item(self, dataset_id: str, reference_id) -> dict:
         """
         Deletes a private dataset based on datasetId.
         Returns an empty payload where response status `200` indicates
         the dataset has been successfully deleted.
         :param payload: { "name": str }
         :return: { "dataset_id": str, "name": str }
         """
-        if item_id:
-            return self.make_request(
-                {}, f"dataset/{dataset_id}/{item_id}", requests.delete
-            )
-        else:  # Assume reference_id is provided
-            return self.make_request(
-                {},
-                f"dataset/{dataset_id}/refloc/{reference_id}",
-                requests.delete,
-            )
+        return self.make_request(
+            {},
+            f"dataset/{dataset_id}/refloc/{reference_id}",
+            requests.delete,
+        )
 
     def populate_dataset(
         self,
@@ -1015,17 +958,13 @@ def create_slice(self, dataset_id: str, payload: dict) -> Slice:
         as a means of identifying items in the dataset.
 
         "name" -- The human-readable name of the slice.
-
-        "dataset_item_ids" -- An optional list of dataset item ids for the items in the slice
-
         "reference_ids" -- An optional list of user-specified identifier for the items in the slice
 
         :param
         dataset_id: id of the dataset
         payload:
         {
             "name": str,
-            "dataset_item_ids": List[str],
             "reference_ids": List[str],
         }
         :return: new Slice object
@@ -1051,14 +990,12 @@ def slice_info(self, slice_id: str) -> dict:
 
         :param
         slice_id: id of the slice
-        id_type: the type of IDs you want in response (either "reference_id" or "dataset_item_id")
-        to identify the DatasetItems
 
         :return:
         {
             "name": str,
             "dataset_id": str,
-            "dataset_item_ids": List[str],
+            "reference_ids": List[str],
         }
         """
         response = self.make_request(
@@ -1118,7 +1055,6 @@ def append_to_slice(
         as a means of identifying items in the dataset.
 
         :param
-        dataset_item_ids: List[str],
         reference_ids: List[str],
 
         :return:
@@ -1182,7 +1118,7 @@ def create_custom_index(
 
         :param
         dataset_id: id of dataset that the custom index is being added to.
-        embeddings_urls: list of urls, each of which being a json mapping dataset_item_id -> embedding vector
+        embeddings_urls: list of urls, each of which being a json mapping reference_id -> embedding vector
         embedding_dim: the dimension of the embedding vectors, must be consistent for all embedding vectors in the index.
         """
         return self.make_request(
diff --git a/nucleus/dataset.py b/nucleus/dataset.py
@@ -360,22 +360,17 @@ def create_slice(
         as a means of identifying items in the dataset.
 
         :param name: The human-readable name of the slice.
-        :param dataset_item_ids: An optional list of dataset item ids for the items in the slice
-        :param reference_ids: An optional list of user-specified identifier for the items in the slice
+        :param reference_ids: A list of user-specified identifier for the items in the slice
 
         :return: new Slice object
         """
         return self._client.create_slice(
             self.id, {NAME_KEY: name, REFERENCE_IDS_KEY: reference_ids}
         )
 
-    def delete_item(self, item_id: str = None, reference_id: str = None):
-        if bool(item_id) == bool(reference_id):
-            raise Exception(
-                "You must specify either a reference_id or an item_id for a DatasetItem."
-            )
+    def delete_item(self, reference_id: str):
         return self._client.delete_dataset_item(
-            self.id, reference_id=reference_id, item_id=item_id
+            self.id, reference_id=reference_id
         )
 
     def list_autotags(self):
diff --git a/nucleus/slice.py b/nucleus/slice.py
@@ -62,7 +62,6 @@ def append(
         as a means of identifying items in the dataset.
 
         :param
-        dataset_item_ids: List[str],
         reference_ids: List[str],
 
         :return: