Add the model authentication example

besirkurtulmus · besirkurtulmus · commit 34dcee520f17 · 2019-12-16T13:50:11.000-08:00
diff --git a/model_authentication/deploy.py b/model_authentication/deploy.py
@@ -0,0 +1,171 @@
+import Algorithmia
+import argparse
+from retry import retry
+from Algorithmia.errors import AlgorithmException
+
+def parse_arguments():
+    """Parse the deployment options from the command line.
+
+    Returns:
+        The ``argparse`` namespace with the attributes ``api_key``,
+        ``username``, ``algoname``, ``model_script``,
+        ``model_dependency_file``, ``data_path`` and ``model_checksum``.
+        Every option accepts at most one value; only ``data_path`` has a
+        default, the others are ``None`` when not given.
+    """
+    # One entry per option: (short flag, long flag, extra keyword arguments)
+    option_specs = (
+        ("-k", "--api_key", {}),
+        ("-u", "--username", {}),
+        ("-a", "--algoname", {}),
+        ("-m", "--model_script", {}),
+        ("-d", "--model_dependency_file", {}),
+        ("-p", "--data_path", {"default": ".my/mycollection"}),
+        ("-c", "--model_checksum", {}),
+    )
+
+    cli = argparse.ArgumentParser()
+    for short_flag, long_flag, extras in option_specs:
+        cli.add_argument(short_flag, long_flag, nargs="?", **extras)
+    return cli.parse_args()
+
+def main(args=None):
+    """Run the deployment with the given arguments or with the CLI arguments.
+
+    Args:
+        args: Namespace-like object that is handed to ``deploy``. When it is
+            ``None`` (the default), the arguments are parsed from the
+            command line instead.
+    """
+    if args is None:
+        args = parse_arguments()
+    # Deploy in both cases: with the call nested under the ``if`` above, a
+    # caller-supplied ``args`` would be silently ignored.
+    deploy(args)
+
+def deploy(args):
+    """Upload the model, create the algorithm, push its code, test and publish it.
+
+    Steps, in order: make sure the data collection exists, upload
+    ``algo/model.h5`` into it, create the algorithm, clone its git repository
+    into ``algo/<algoname>``, write the templated algorithm script and the
+    dependency file into the clone, commit and push them, call the freshly
+    built version, publish it, and finally call the published version.
+
+    Args:
+        args: Namespace-like object with the attributes ``api_key``,
+            ``username``, ``algoname``, ``model_script``,
+            ``model_dependency_file``, ``data_path`` and ``model_checksum``.
+
+    Raises:
+        ValueError: If any of those attributes is missing or ``None``.
+    """
+    # Standard-library helpers used below, imported locally like the other
+    # step-specific imports of this function
+    import json
+    import shutil
+
+    # Fail before any remote resource is created: every one of these values
+    # is needed by a later step
+    required = (
+        "api_key", "username", "algoname", "model_script",
+        "model_dependency_file", "data_path", "model_checksum",
+    )
+    missing = [name for name in required if getattr(args, name, None) is None]
+    if missing:
+        raise ValueError("Missing required argument(s): {}".format(", ".join(missing)))
+
+    # A data collection, where we'll be storing our files
+    data_path = "data://{}".format(args.data_path)
+
+    # Create a new algorithmia client
+    client = Algorithmia.client(args.api_key)
+
+    # Create data collection if it doesn't exist
+    if not client.dir(data_path).exists():
+        client.dir(data_path).create()
+
+    ### 3. Upload model file ###
+
+    # Define local work directory
+    local_dir = "algo"
+
+    model_name = "model.h5"
+    local_model = "{}/{}".format(local_dir, model_name)
+    data_model = "{}/{}".format(data_path, model_name)
+
+    # Upload our model file to our data collection
+    client.file(data_model).putFile(local_model)
+
+    ### 4. Create new algorithm ###
+
+    # Algorithms are referred to with the following schema: username/algoname
+    algo_namespace = "{}/{}".format(args.username, args.algoname)
+
+    # Here are some details you can define for your algorithm
+    details = {
+        "summary": "This algorithm classifies 28x28 MNSIT images.",
+        "label": "MNIST Classifier",
+        "tagline": "mnist_classifier"
+    }
+
+    # 1. We're making our algorithm closed-sourced – "source_visibility"
+    #
+    # 2. We're selecting a package set that has tensorflow-gpu already installed. – "package_set"
+    #    Even though we could manually install it later, using the optimized
+    #    & pre-installed image allows you to compile things faster.
+    #
+    # 3. We're selecting the Algorithmia Platform License (aka. "apl"). – "license"
+    #
+    # 4. We're giving our algorithm internet access. – "network_access"
+    #
+    # 5. We're allowing our algorithm to call other algorithms. – "pipeline_enabled"
+    settings = {
+        "source_visibility": "closed",
+        "package_set": "tensorflow-gpu-2.0",
+        "license": "apl",
+        "network_access": "full",
+        "pipeline_enabled": True
+    }
+
+    # A 28x28 array of zeros. It is used both as the sample input and as the
+    # payload of the test calls below. The rows share one list object, which
+    # is fine because the array is never modified.
+    algo_input = [[0] * 28] * 28
+
+    # Let's also provide a sample input for our algorithm: the JSON text of
+    # the array above, generated instead of spelled out as one huge literal
+    version_info = {
+        "sample_input": json.dumps(algo_input)
+    }
+
+    print("Algorithm namepace: {}".format(algo_namespace))
+
+    # Create a new algorithm
+    client.algo(algo_namespace).create(details, settings, version_info)
+
+    # Print the URL to the algorithm
+    print("Algorithm URL: https://algorithmia.com/algorithms/{}".format(algo_namespace))
+
+    ### 5. Git clone our algorithm locally  ###
+
+    import urllib.parse
+    from git import Repo
+
+    # Encode API key, so we can use it in the git URL
+    # NOTE(review): the key becomes part of the remote URL of the clone, so
+    # it presumably ends up in the clone's git configuration – treat the
+    # local directory as sensitive.
+    encoded_api_key = urllib.parse.quote_plus(args.api_key)
+
+    algo_repo = "https://{}:{}@git.algorithmia.com/git/{}/{}.git".format(args.username, encoded_api_key, args.username, args.algoname)
+
+    # clone_from hands back the repository object for the new clone
+    repo_dir = "{}/{}".format(local_dir, args.algoname)
+    cloned_repo = Repo.clone_from(algo_repo, repo_dir)
+
+    ### 6. The algorithm script & dependency file ###
+
+    algo_script_path = "{}/src/{}.py".format(repo_dir, args.algoname)
+    dependency_file_path = "{}/{}".format(repo_dir, "requirements.txt")
+
+    # Fill in the placeholders of the script template & copy it over
+    with open(args.model_script) as f:
+        template = f.read()
+    script_source = template.replace('<MODEL_FILE_CHECKSUM>', args.model_checksum)\
+        .replace('<DATA_DIR>', args.data_path)
+
+    with open(algo_script_path, "w") as f:
+        f.write(script_source)
+
+    shutil.copyfile(args.model_dependency_file, dependency_file_path)
+
+    ### 7. Upload our source code ###
+
+    files = ["src/{}.py".format(args.algoname), "requirements.txt"]
+    cloned_repo.index.add(files)
+
+    cloned_repo.index.commit("Add algorithm files")
+
+    origin = cloned_repo.remote(name='origin')
+
+    print("Pushing source code upstream, uploading model file & compiling algorithm...")
+
+    origin.push()
+
+    # Print the URL to the algorithm source code
+    print("Algorithm Source Code is available at: https://algorithmia.com/algorithms/{}/source".format(algo_namespace))
+
+    ### 8. Call & test our algorithm ###
+
+    print("Testing new compiled algorithm via API endpoint...")
+    latest_hash = client.algo(algo_namespace).info().version_info.git_hash
+
+    # Call the algorithm until the endpoint of the requested version becomes
+    # available: up to 20 attempts, one second apart
+    @retry(AlgorithmException, tries=20, delay=1)
+    def get_probability(ALGO, VERSION, INPUT):
+        return client.algo("{}/{}".format(ALGO, VERSION)).pipe(INPUT).result["prob"]
+
+    # Call the algorithm endpoint with the latest hash; only success matters,
+    # the returned values are not inspected
+    get_probability(algo_namespace, latest_hash, algo_input)
+
+    print("Test complete!")
+
+    ### 9. Publish our algorithm ###
+
+    print("Publishing and deploying algorithm...")
+
+    # Now let's publish/deploy our algorithm
+    client.algo(algo_namespace).publish()
+
+    latest_version = client.algo(algo_namespace).info().version_info.semantic_version
+
+    # Call the algorithm endpoint with the latest version
+    get_probability(algo_namespace, latest_version, algo_input)
+
+    print("Algorithm has been deployed!")
+
+# Start the deployment only when this file is executed as a script;
+# main() is called without arguments here.
+if __name__ == "__main__":
+    main()
diff --git a/model_authentication/model.py b/model_authentication/model.py
@@ -0,0 +1,52 @@
+import Algorithmia
+from tensorflow import keras
+import numpy as np
+import pickle
+import hashlib
+
+def sha256_checksum(filename, block_size=65536):
+    """Return the hex-encoded SHA-256 digest of the file at *filename*.
+
+    The file is opened in binary mode and consumed in pieces of
+    ``block_size`` bytes (64KB by default), so it is never held in memory
+    as a whole.
+    """
+    digest = hashlib.sha256()
+    with open(filename, "rb") as stream:
+        while True:
+            chunk = stream.read(block_size)
+            if not chunk:
+                # An empty read marks the end of the file
+                break
+            digest.update(chunk)
+    return digest.hexdigest()
+
+def authenticate_model(model_file, checksum):
+    """Verify that *model_file* hashes to the expected SHA-256 *checksum*.
+
+    Args:
+        model_file: Path of the local model file to verify.
+        checksum: Expected hex digest of that file.
+
+    Raises:
+        AssertionError: If the computed digest differs from *checksum*. It
+            is raised explicitly instead of through an ``assert`` statement,
+            so the check is still performed when Python runs with ``-O``.
+    """
+    # Hash the file once, so the value that is printed is exactly the value
+    # that is compared
+    actual = sha256_checksum(model_file)
+    print("Asserting {}=={}".format(actual, checksum))
+    if actual != checksum:
+        raise AssertionError(
+            "Model checksum mismatch: expected {}, got {}".format(checksum, actual)
+        )
+
+# Module-level setup: everything below runs once, when this module is
+# loaded, and leaves the verified model in the global ``model``.
+
+# Create our Algorithmia client
+client = Algorithmia.client()
+
+# Our model file checksum
+# The placeholder below is replaced with the real checksum by deploy() in
+# deploy.py (a plain text substitution), so it must stay exactly as written.
+model_file_checksum = "<MODEL_FILE_CHECKSUM>"
+
+# Define where our model file lives in our data collection
+# <DATA_DIR> is likewise substituted by deploy() with the data path.
+data_model = "data://<DATA_DIR>/model.h5"
+
+# Download our model file and keep the name (path) of the local copy
+model_file = client.file(data_model).getFile().name
+
+# Authenticate model file before doing anything
+# (the model is only loaded after the checksum comparison has passed)
+authenticate_model(model_file, model_file_checksum)
+
+# Load the verified file as a Keras model
+model = keras.models.load_model(model_file)
+
+def preprocess_input(two_d_array):
+    """Validate a 28 x 28 input and turn it into a batch of one for the model.
+
+    Args:
+        two_d_array: Sequence of 28 rows, each holding 28 values.
+
+    Returns:
+        A numpy array built from the input with one extra axis of length 1
+        inserted in front.
+
+    Raises:
+        AssertionError: If the input does not consist of exactly 28 rows of
+            28 values each. It is raised explicitly instead of through an
+            ``assert`` statement, so the check still runs under ``python -O``.
+    """
+    side = 28
+    # Check both dimensions: the number of rows and the length of every row
+    # (comparing only the lengths of rows 0 and 1 would let inputs with a
+    # wrong row count through)
+    if len(two_d_array) != side or any(len(row) != side for row in two_d_array):
+        raise AssertionError("Expected a {0} x {0} input".format(side))
+    np_array = np.array(two_d_array)
+    # Expand dimension by 1 for model consumption
+    return np.expand_dims(np_array, 0)
+
+def apply(input):
+    """Run the model on one input and return its output as plain floats.
+
+    Args:
+        input: The raw two-dimensional input; it is validated and batched by
+            ``preprocess_input``.
+
+    Returns:
+        A dict with the single key ``"prob"``, holding the first row of the
+        model's prediction converted to a list of builtin floats.
+    """
+    # Validate the raw input and wrap it into a batch of one
+    batch = preprocess_input(input)
+    # Predict on that batch and keep the result for its only element
+    first_row = model.predict(batch)[0]
+    # Return result back to user, with every entry as a builtin float
+    return {"prob": [float(value) for value in first_row]}
diff --git a/model_authentication/model_authentication.ipynb b/model_authentication/model_authentication.ipynb
diff --git a/model_authentication/model_requirements.txt b/model_authentication/model_requirements.txt
@@ -0,0 +1,3 @@
+algorithmia>=1.0.0,<2.0
+six
+tensorflow-gpu==2.0.0
diff --git a/model_authentication/requirements.txt b/model_authentication/requirements.txt
@@ -0,0 +1,8 @@
+tensorflow==2.0.0
+algorithmia==1.2.1
+jupyter==1.0.0
+gitpython==2.1.11
+matplotlib==3.0.2
+urllib3==1.24.3
+retry==0.9.2
+numpy==1.16.1

Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,3 @@`
	`1`	`+algorithmia>=1.0.0,<2.0`
	`2`	`+six`
	`3`	`+tensorflow-gpu==2.0.0`