Merge pull request #375 from Labelbox/gj/video-mal

Gareth · web-flow · commit 3385dce391e1 · 2022-01-06T12:29:56.000-08:00
diff --git a/examples/model_assisted_labeling/image_mal.ipynb b/examples/model_assisted_labeling/image_mal.ipynb
@@ -23,13 +23,7 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "!pip install labelbox\n",
-    "!pip install requests\n",
-    "!pip install ndjson\n",
-    "!pip install scikit-image\n",
-    "!pip install PILLOW\n",
-    "!pip install tensorflow\n",
-    "!pip install opencv-python"
+    "!pip install -q labelbox requests ndjson scikit-image PILLOW tensorflow opencv-python"
    ]
   },
   {
@@ -534,7 +528,7 @@
  ],
  "metadata": {
   "kernelspec": {
-   "display_name": "Python 3",
+   "display_name": "Python 3 (ipykernel)",
    "language": "python",
    "name": "python3"
   },
@@ -548,9 +542,9 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.8.8"
+   "version": "3.8.2"
   }
  },
  "nbformat": 4,
  "nbformat_minor": 5
-}
+}
diff --git a/examples/model_assisted_labeling/video_mal.ipynb b/examples/model_assisted_labeling/video_mal.ipynb
@@ -0,0 +1,339 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "id": "stupid-court",
+   "metadata": {},
+   "source": [
+    "# Video MAL"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "intellectual-idaho",
+   "metadata": {},
+   "source": [
+    "* Upload model inferences for video tasks\n",
+    "* Supported types\n",
+    "    * bounding box"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "id": "voluntary-minister",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "!pip install -q labelbox"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "id": "committed-richards",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import os\n",
+    "import uuid\n",
+    "from io import BytesIO\n",
+    "from typing import Dict, Any, Tuple\n",
+    "\n",
+    "from labelbox import Client, LabelingFrontend\n",
+    "from labelbox.schema.ontology import OntologyBuilder, Tool, Classification, Option"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "id": "thirty-grocery",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "API_KEY = os.environ.get(\"LABELBOX_API_KEY\")\n",
+    "if not API_KEY:\n",
+    "    raise EnvironmentError(\"Missing API Key\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "id": "conservative-marsh",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Only update this if you have an on-prem deployment\n",
+    "ENDPOINT = \"https://api.labelbox.com/graphql\""
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "id": "affecting-myanmar",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "client = Client(\n",
+    "    api_key=API_KEY,\n",
+    "    endpoint=ENDPOINT\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "blessed-venture",
+   "metadata": {},
+   "source": [
+    "### Project Setup"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "id": "suburban-crowd",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Define the ontology. This example uses a single bounding box tool.\n",
+    "ontology_builder = OntologyBuilder(\n",
+    "    tools=[\n",
+    "        Tool(tool=Tool.Type.BBOX, name=\"jellyfish\")\n",
+    "    ]\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "id": "modern-program",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Let's set up a project to label.\n",
+    "# Note: see the Ontology, Project, and Project_setup notebooks for more information on this section.\n",
+    "project = client.create_project(name=\"video_mal_project\")\n",
+    "dataset = client.create_dataset(name=\"video_mal_dataset\")\n",
+    "dataset.create_data_row(\n",
+    "    row_data=\"https://storage.labelbox.com/cjhfn5y6s0pk507024nz1ocys%2Fb8837f3b-b071-98d9-645e-2e2c0302393b-jellyfish2-100-110.mp4\")\n",
+    "editor = next(\n",
+    "    client.get_labeling_frontends(where=LabelingFrontend.name == \"Editor\")\n",
+    ")\n",
+    "project.setup(editor, ontology_builder.asdict())\n",
+    "project.datasets.connect(dataset)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "portable-grenada",
+   "metadata": {},
+   "source": [
+    "#### Grab featureSchemaIds"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "id": "abstract-fifteen",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "{'jellyfish': 'cky3dt2lja37d0z9t26wf3qo5'}\n"
+     ]
+    }
+   ],
+   "source": [
+    "# When we created a project with the ontology defined above, all of the ids were assigned.\n",
+    "# So let's reconstruct the ontology builder with all of the ids.\n",
+    "ontology = ontology_builder.from_project(project)\n",
+    "# We want all of the feature schemas to be easily accessible by name.\n",
+    "schema_lookup = {tool.name: tool.feature_schema_id for tool in ontology.tools}\n",
+    "print(schema_lookup)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "portuguese-arthur",
+   "metadata": {},
+   "source": [
+    "## Import Format\n",
+    "\n",
+    "* [Documentation](https://docs.labelbox.com/docs/bounding-box-json)\n",
+    "\n",
+    "\n",
+    "```\n",
+    "Each row of the import is a unique instance\n",
+    "\n",
+    "schemaId: <featureSchemaId>\n",
+    "dataRow:\n",
+    "    id: <dataRowId>\n",
+    "Instance:\n",
+    "    [Segments]:\n",
+    "        [KeyFrames]:\n",
+    "            frame:\n",
+    "            bbox:\n",
+    "                top:\n",
+    "                left:\n",
+    "                height:\n",
+    "                width:\n",
+    "```\n",
+    "\n",
+    "**segments**: A segment represents a continuous section where an object is visible. If an instance disappears then the segment ends. If it re-appears, a new segment is created.\n",
+    "\n",
+    "**keyframes**: Keyframes identify the location of an instance. Between keyframes, the location of the instance is interpolated.\n",
+    "\n",
+    "**bbox**: The coordinates of the bounding box"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 11,
+   "id": "5fc417c5",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "segments = [\n",
+    "    {\n",
+    "        \"keyframes\": [\n",
+    "            {\n",
+    "                \"frame\": 1,\n",
+    "                \"bbox\": {\n",
+    "                    \"top\": 80,\n",
+    "                    \"left\": 80,\n",
+    "                    \"height\": 80,\n",
+    "                    \"width\": 80\n",
+    "                }\n",
+    "            },\n",
+    "            {\n",
+    "                \"frame\": 20,\n",
+    "                \"bbox\": {\n",
+    "                    \"top\": 125,\n",
+    "                    \"left\": 125,\n",
+    "                    \"height\": 200,\n",
+    "                    \"width\": 300\n",
+    "                }\n",
+    "            }\n",
+    "        ]\n",
+    "    },\n",
+    "    {\n",
+    "        \"keyframes\": [\n",
+    "            {\n",
+    "                \"frame\": 27,\n",
+    "                \"bbox\": {\n",
+    "                    \"top\": 80,\n",
+    "                    \"left\": 50,\n",
+    "                    \"height\": 80,\n",
+    "                    \"width\": 50\n",
+    "                }\n",
+    "            }\n",
+    "        ]\n",
+    "    }\n",
+    "]"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "convertible-entry",
+   "metadata": {},
+   "source": [
+    "##### Create helper functions to make this much easier"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 12,
+   "id": "developing-beauty",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def create_video_bbox_ndjson(datarow_id: str, schema_id: str, segments: Dict[str, Any]) -> Dict[str, Any]:\n",
+    "    return {\n",
+    "        \"uuid\": str(uuid.uuid4()),\n",
+    "        \"schemaId\": schema_id,\n",
+    "        \"dataRow\": {\"id\": datarow_id},\n",
+    "        \"segments\": segments\n",
+    "    }"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 13,
+   "id": "asian-savings",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "uploads = []\n",
+    "\n",
+    "for data_row in dataset.data_rows():\n",
+    "    uploads.append(create_video_bbox_ndjson(data_row.uid, schema_lookup['jellyfish'], segments))"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "perfect-seafood",
+   "metadata": {},
+   "source": [
+    "### Upload the annotations"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 14,
+   "id": "entire-community",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Let's upload!\n",
+    "# `validate` must be set to False for video bounding boxes\n",
+    "upload_task = project.upload_annotations(name=f\"upload-job-{uuid.uuid4()}\",\n",
+    "                                         annotations=uploads,\n",
+    "                                         validate=False)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 15,
+   "id": "hollywood-faculty",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "[]\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Wait for the upload to finish (this may take up to five minutes)\n",
+    "upload_task.wait_until_done()\n",
+    "# Review the upload status\n",
+    "print(upload_task.errors)"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3 (ipykernel)",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.8.2"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}