huggingface userguide (#84)

z7ye · web-flow · commit 692b45dbeab0 · 2023-03-01T17:44:41.000-08:00
diff --git a/docs/source/ads.model.framework.rst b/docs/source/ads.model.framework.rst
@@ -60,6 +60,14 @@ ads.model.framework.xgboost\_model module
    :undoc-members:
    :show-inheritance:
 
+ads.model.framework.huggingface\_model module
+-----------------------------------------
+
+.. automodule:: ads.model.framework.huggingface_model
+   :members:
+   :undoc-members:
+   :show-inheritance:
+
 Module contents
 ---------------
 
diff --git a/docs/source/user_guide/model_registration/framework_specific_instruction.rst b/docs/source/user_guide/model_registration/framework_specific_instruction.rst
@@ -9,6 +9,7 @@
     frameworks/sparkpipelinemodel
     frameworks/lightgbmmodel
     frameworks/xgboostmodel
+    frameworks/huggingfacemodel
     frameworks/automlmodel
     frameworks/genericmodel
-    
+
diff --git a/docs/source/user_guide/model_registration/frameworks/huggingfacemodel.rst b/docs/source/user_guide/model_registration/frameworks/huggingfacemodel.rst
@@ -0,0 +1,242 @@
+.. HuggingFacePipelineModel:
+
+HuggingFacePipelineModel
+************************
+
+.. versionadded:: 2.8.2
+
+See `API Documentation <../../../ads.model_framework.html#ads.model.framework.huggingface_model.HuggingFacePipelineModel>`__
+
+Overview
+========
+
+The ``ads.model.framework.huggingface_model.HuggingFacePipelineModel`` class in ADS is designed to allow you to rapidly get a HuggingFace pipelines into production. The ``.prepare()`` method creates the model artifacts that are needed to deploy a functioning pipeline without you having to configure it or write code. However, you can customize the required ``score.py`` file.
+
+.. include:: ../_template/overview.rst
+
+The following steps take your trained ``HuggingFacePipelineModel`` model and deploy it into production with a few lines of code.
+
+**Create a HuggingFace Pipeline**
+
+Load a `ImageSegmentationPipeline <https://huggingface.co/docs/transformers/main_classes/pipelines#transformers.ImageSegmentationPipeline>`_ pretrained model.
+
+.. code-block:: python3
+
+    >>> from transformers import pipeline
+
+    >>> segmenter = pipeline(task="image-segmentation", model="facebook/detr-resnet-50-panoptic", revision="fc15262")
+    >>> preds = segmenter(
+    ...     "https://huggingface.co/datasets/huggingface/documentation-images/resolve/main/pipeline-cat-chonk.jpeg"
+    ... )
+    >>> preds
+    [{'score': 0.987885,
+        'label': 'LABEL_184',
+        'mask': <PIL.Image.Image image mode=L size=960x686>},
+        {'score': 0.997345,
+        'label': 'snow',
+        'mask': <PIL.Image.Image image mode=L size=960x686>},
+        {'score': 0.997247,
+        'label': 'cat',
+        'mask': <PIL.Image.Image image mode=L size=960x686>}]
+
+Prepare Model Artifact
+======================
+
+.. code-block:: python3
+
+    >>> from ads.common.model_metadata import UseCaseType
+    >>> from ads.model import HuggingFacePipelineModel
+
+    >>> import tempfile
+
+    >>> # Prepare the model
+    >>> artifact_dir = "huggingface_pipeline_model_artifact"
+    >>> huggingface_pipeline_model = HuggingFacePipelineModel(model, artifact_dir=artifact_dir)
+    >>> huggingface_pipeline_model.prepare(
+    ...    inference_conda_env="<your-conda-pack-path>",
+    ...    inference_python_version="<your-python-version>",
+    ...    training_conda_env="<your-conda-pack-path>",
+    ...    use_case_type=UseCaseType.OTHER,
+    ...    force_overwrite=True,
+    ...)
+    # You don't need to modify the score.py generated. The model can be loaded by the transformers.pipeline.
+    # More info here - https://huggingface.co/docs/transformers/main_classes/pipelines#transformers.pipeline
+
+
+Instantiate a ``HuggingFacePipelineModel()`` object with HuggingFace pipelines. All the pipelines related files are saved under the ``artifact_dir``.
+
+For more detailed information on what parameters that ``HuggingFacePipelineModel`` takes, refer to the `API Documentation <../../../ads.model_framework.html#ads.model.framework.huggingface_model.HuggingFacePipelineModel>`__
+
+
+
+Summary Status
+==============
+
+.. include:: ../_template/summary_status.rst
+
+.. figure:: ../figures/summary_status.png
+   :align: center
+
+Register Model
+==============
+
+.. code-block:: python3
+
+    >>> # Register the model
+    >>> model_id = huggingface_pipeline_model.save()
+
+    Model is successfully loaded.
+    ['.model-ignore', 'score.py', 'config.json', 'runtime.yaml', 'preprocessor_config.json', 'pytorch_model.bin']
+
+    'ocid1.datasciencemodel.oc1.xxx.xxxxx'
+
+Deploy and Generate Endpoint
+============================
+
+.. code-block:: python3
+
+    >>> # Deploy and create an endpoint for the huggingface_pipeline_model 
+    >>> huggingface_pipeline_model.deploy(
+    ...     display_name="HuggingFace Pipeline Model For Image Segmentation",
+    ...     deployment_log_group_id="ocid1.loggroup.oc1.xxx.xxxxx",
+    ...     deployment_access_log_id="ocid1.log.oc1.xxx.xxxxx",
+    ...     deployment_predict_log_id="ocid1.log.oc1.xxx.xxxxx",
+    ... )
+    >>> print(f"Endpoint: {huggingface_pipeline_model.model_deployment.url}")
+
+Run Prediction against Endpoint
+===============================
+
+.. code-block:: python3
+
+    >>> # Download an image
+    >>> import PIL.Image
+    >>> import requests
+    >>> import cloudpickle
+    >>> image_url = "https://huggingface.co/datasets/huggingface/documentation-images/resolve/main/pipeline-cat-chonk.jpeg"
+    >>> image = PIL.Image.open(requests.get(image_url, stream=True).raw)
+
+    >>> # Generate prediction by invoking the deployed endpoint
+    >>> preds = huggingface_pipeline_model.predict(image)["prediction"]
+    >>> print([{"score": round(pred["score"], 4), "label": pred["label"]} for pred in preds['prediction']])
+    [{'score': 0.9879, 'label': 'LABEL_184'},
+    {'score': 0.9973, 'label': 'snow'},
+    {'score': 0.9972, 'label': 'cat'}]
+
+
+Predict with Image
+------------------
+
+Predict Image by passing a PIL.Image.Image object using the ``data`` argument in ``predict()`` to predict a single image.
+The image will be converted to bytes using cloudpickle so it can be passed to the endpoint.
+It will be loaded back to PIL.Image.Image in ``score.py`` before pass into the pipeline.
+
+.. note::
+    - The payload size limit is 10 MB. Read more about invoking a model deployment `here <https://docs.oracle.com/iaas/data-science/using/model-dep-invoke.htm#model_dep_invoke>`_.
+    - Model deployment currently does not support internet(coming soon), hence you cannot pass in a url.
+
+Predict with Multiple Arguments
+-------------------------------
+
+If your model takes more than one argument, you can pass in through dictionary with the keys as the argument name and values as the value of the arguement.
+
+.. code-block:: python3
+
+    >>> your_huggingface_pipeline_model.verify({"parameter_name_1": "parameter_value_1", ..., "parameter_name_n": "parameter_value_n"})
+    >>> your_huggingface_pipeline_model.predict({"parameter_name_1": "parameter_value_1", ..., "parameter_name_n": "parameter_value_n"})
+
+
+Run Prediction with oci sdk
+==============================
+
+Model deployment endpoints can be invoked with the oci sdk. This example invokes a model deployment with the oci sdk with a ``bytes`` payload:
+
+``bytes`` payload example
+------------------------------
+
+.. code-block:: python3
+
+    >>> # The OCI SDK must be installed for this example to function properly.
+    >>> # Installation instructions can be found here: https://docs.oracle.com/en-us/iaas/Content/API/SDKDocs/pythonsdk.htm
+
+    >>> import requests
+    >>> import oci
+    >>> from ads.common.auth import default_signer
+    >>> import cloudpickle
+    >>> import PIL.Image
+    >>> import cloudpickle
+    >>> headers = {"Content-Type": "application/octet-stream"} 
+    >>> endpoint = huggingface_pipeline_model.model_deployment.url + "/predict"
+
+    >>> ## download the image
+    >>> image_url = "https://huggingface.co/datasets/Narsil/image_dummy/raw/main/parrots.png"
+    >>> image = PIL.Image.open(requests.get(image_link, stream=True).raw)
+    >>> image_bytes = cloudpickle.dumps(image)
+
+    >>> preds = requests.post(endpoint, data=image_bytes, auth=default_signer()['signer'], headers=headers).json()
+    >>> print([{"score": round(pred["score"], 4), "label": pred["label"]} for pred in preds['prediction']])
+    [{'score': 0.9879, 'label': 'LABEL_184'},
+    {'score': 0.9973, 'label': 'snow'},
+    {'score': 0.9972, 'label': 'cat'}]
+
+
+Example
+=======
+
+.. code-block:: python3
+
+    from transformers import pipeline
+    from ads.model import HuggingFacePipelineModel
+
+    import tempfile
+    import PIL.Image
+    from ads.common.auth import default_signer
+    import requests
+    import cloudpickle
+
+    ## download the image
+    image_url = "https://huggingface.co/datasets/Narsil/image_dummy/raw/main/parrots.png"
+    image = PIL.Image.open(requests.get(image_link, stream=True).raw)
+
+    ## download the pretrained model
+    classifier = pipeline(model="openai/clip-vit-large-patch14")
+    classifier(
+            images=image,
+            candidate_labels=["animals", "humans", "landscape"],
+        )
+
+    ## Initiate a HuggingFacePipelineModel instance
+    zero_shot_image_classification_model = HuggingFacePipelineModel(classifier, artifact_dir=empfile.mkdtemp())
+
+    # Autogenerate score.py, serialized model, runtime.yaml
+    conda_pack_path = "oci://bucket@namespace/path/to/conda/pack"
+    python_version = "3.x" # Remember to update 3.x with your actual python version, e.g. 3.8
+    zero_shot_image_classification_model.prepare(inference_conda_env=conda_pack_path, inference_python_version = python_version, force_overwrite=True)
+
+    ## Convert payload to bytes
+    data = {"images": image, "candidate_labels": ["animals", "humans", "landscape"]}
+    body = cloudpickle.dumps(data) # convert image to bytes
+
+    # Verify generated artifacts
+    zero_shot_image_classification_model.verify(data=data)
+    zero_shot_image_classification_model.verify(data=body)
+
+    # Register HuggingFace Pipeline model
+    zero_shot_image_classification_model.save()
+
+    ## Deploy
+    log_group_id = "<log_group_id>"
+    log_id = "<log_id>"
+    zero_shot_image_classification_model.deploy(deployment_bandwidth_mbps=100,
+                    wait_for_completion=False,
+                    deployment_log_group_id = log_group_id,
+                    deployment_access_log_id = log_id,
+                    deployment_predict_log_id = log_id)
+    zero_shot_image_classification_model.predict(image)
+    zero_shot_image_classification_model.predict(body)
+
+    ### Invoke the model by sending bytes
+    auth = default_signer()['signer']
+    endpoint = zero_shot_image_classification_model.model_deployment.url + "/predict"
+    headers = {"Content-Type": "application/octet-stream"}
+    requests.post(endpoint, data=body, auth=auth, headers=headers).json()
diff --git a/docs/source/user_guide/model_registration/frameworks/pytorchmodel.rst b/docs/source/user_guide/model_registration/frameworks/pytorchmodel.rst
@@ -215,7 +215,7 @@ Deploy and Generate Endpoint
 
 .. code-block:: python3
 
-    >>> # Deploy and create an endpoint for the TensorFlow model
+    >>> # Deploy and create an endpoint for the PyTorch model
     >>> pytorch_model.deploy(
             display_name="PyTorch Model For Classification",
             deployment_log_group_id="ocid1.loggroup.oc1.xxx.xxxxx",
diff --git a/docs/source/user_guide/model_registration/quick_start.rst b/docs/source/user_guide/model_registration/quick_start.rst
diff --git a/docs/source/user_guide/model_serialization/index.rst b/docs/source/user_guide/model_serialization/index.rst