In [None]:
# --- Kubernetes / Clipper connection settings ---
K8S_PROXY_ADDR = "127.0.0.1:8001"  # host:port of the Kubernetes API proxy
K8S_NAMESPACE = "mdt"              # namespace handed to the container manager

# --- Clipper application and model identifiers ---
APP_NAME = "tf-classification"
MODEL_NAME = "clipper-tf-predict"
VERSION = 1

# --- Model artefact and container registry ---
MODEL_FILE = "model.ckpt"  # checkpoint file name for the trained model
REPO_URL = "658391232643.dkr.ecr.us-west-2.amazonaws.com"  # passed as `registry=` when deploying

Train the model and save it to a TensorFlow checkpoint file (`model.ckpt`)

In [None]:
from __future__ import print_function

import tensorflow as tf
from tensorflow.contrib.tensor_forest.python import tensor_forest
from tensorflow.python.ops import resources

from sklearn.datasets import load_iris
from sklearn.model_selection import train_test_split

import numpy as np

# Ignore all GPUs, tf random forest does not benefit from it.
import os
os.environ["CUDA_VISIBLE_DEVICES"] = ""

# Load the iris data set and hold out 33% of the samples for testing.
# random_state is fixed so the train/test split is the same on every run.
data = load_iris()
dX, dy = data["data"], data["target"]
X_train, X_test, y_train, y_test = train_test_split(
    dX, dy, test_size=0.33, random_state=42)

# Parameters
num_steps = 500  # Total steps to train
batch_size = 10  # The number of samples per batch
num_classes = 3  # Number of target classes passed to the forest
num_features = 4  # Number of input features per sample (width of placeholder X)
num_trees = 10  # Number of trees in the forest
max_nodes = 100  # Passed to ForestHParams as max_nodes

# Input and Target data
# NOTE(review): none of the tensors below are given explicit names, and a later
# cell looks them up by the names 'Placeholder:0', 'Placeholder_1:0',
# 'probabilities:0' and 'Mean_1:0'. Presumably those are the auto-generated
# names, so reordering the ops in this cell may break that lookup -- confirm
# against the tensors printed after training before changing anything here.
X = tf.placeholder(tf.float32, shape=[None, num_features])
# For random forest, labels must be integers (the class id)
Y = tf.placeholder(tf.int32, shape=[None])

# Random Forest Parameters
hparams = tensor_forest.ForestHParams(num_classes=num_classes,
                                      num_features=num_features,
                                      num_trees=num_trees,
                                      max_nodes=max_nodes).fill()

# Build the Random Forest
forest_graph = tensor_forest.RandomForestGraphs(hparams)
# Get training graph and loss
train_op = forest_graph.training_graph(X, Y)
loss_op = forest_graph.training_loss(X, Y)

# Measure the accuracy: the predicted class is the argmax over the first output
# of the inference graph, compared against the integer labels in Y.
infer_op, _, _ = forest_graph.inference_graph(X)
correct_prediction = tf.equal(tf.argmax(infer_op, 1), tf.cast(Y, tf.int64))
accuracy_op = tf.reduce_mean(tf.cast(correct_prediction, tf.float32))

# Initialize the variables (i.e. assign their default value) and forest resources
init_vars = tf.group(tf.global_variables_initializer(),
                     resources.initialize_resources(resources.shared_resources()))

def next_batch(size):
    """Return a random mini-batch drawn from the training split.

    Row positions are sampled with ``np.random.choice`` using its default
    settings (sampling with replacement), so a row can appear more than once
    in the same batch.

    Args:
        size: Number of samples to draw.

    Returns:
        A ``(features, labels)`` tuple indexed out of ``X_train`` and
        ``y_train`` with the same sampled positions.
    """
    picked_rows = np.random.choice(len(X_train), size)
    return X_train[picked_rows], y_train[picked_rows]


# Start TensorFlow session
# Start the TensorFlow session used for training and evaluation.
sess = tf.Session()

# Run the initializer for the variables and the forest resources.
sess.run(init_vars)

# Saver used at the end of this cell to write the trained model to disk.
saver = tf.train.Saver()

# Training
for i in range(1, num_steps + 1):
    # Draw a random mini-batch of training features and their integer labels.
    batch_x, batch_y = next_batch(batch_size)
    _, loss = sess.run([train_op, loss_op], feed_dict={X: batch_x, Y: batch_y})
    # Report on the first step and then every 50 steps. The accuracy shown
    # here is measured on the current training batch, not on held-out data.
    if i % 50 == 0 or i == 1:
        acc = sess.run(accuracy_op, feed_dict={X: batch_x, Y: batch_y})
        print('Step %i, Loss: %f, Acc: %f' % (i, loss, acc))

# Test Model: accuracy on the held-out split.
print("Test Accuracy:", sess.run(
    accuracy_op, feed_dict={X: X_test, Y: y_test}))

# Print the tensors related to this model; their names are what the restore
# cell uses to look the tensors up again.
print(accuracy_op)
print(infer_op)
print(X)
print(Y)

# Save the model to a checkpoint file. The file name comes from MODEL_FILE so
# it is defined in one place; with the default value the path is "./model.ckpt".
save_path = saver.save(sess, "./" + MODEL_FILE)

Connect to Clipper and register the application

In [None]:
from clipper_admin import ClipperConnection, KubernetesContainerManager

# Reach the cluster through the Kubernetes proxy configured in the first cell.
manager = KubernetesContainerManager(
    kubernetes_proxy_addr=K8S_PROXY_ADDR,
    namespace=K8S_NAMESPACE,
)
clipper_conn = ClipperConnection(manager)
clipper_conn.connect()

# Register the application that clients will query.
# slo_micros is given in microseconds: 100000000 us = 100 seconds.
clipper_conn.register_application(
    name=APP_NAME,
    input_type='doubles',
    default_output='0',
    slo_micros=100000000,
)

Create a prediction function by loading the model

In [None]:
# Restore the trained model into a dedicated graph.
#
# When the notebook is run top to bottom, the default graph already contains
# the training graph. Importing the meta graph into it again would add a second
# copy of every op under a uniquified name, and the name lookups below could
# then resolve to the training-graph tensors instead of the restored ones.
# A fresh graph keeps the saved names intact and also works in a new kernel.
graph = tf.Graph()
sess = tf.Session(graph=graph)
with graph.as_default():
    saver = tf.train.import_meta_graph(MODEL_FILE + '.meta')
    saver.restore(sess, MODEL_FILE)

# Look the tensors up by the names printed at the end of the training cell.
load_infer_op = graph.get_tensor_by_name('probabilities:0')
accuracy_op = graph.get_tensor_by_name('Mean_1:0')
oX = graph.get_tensor_by_name('Placeholder:0')
oY = graph.get_tensor_by_name('Placeholder_1:0')

def predict(X):
    """Run the restored model on a batch of feature rows.

    Args:
        X: Batch of feature rows fed to the restored input placeholder ``oX``.

    Returns:
        A list with one string per output row, each being ``str()`` of that
        row of the ``load_infer_op`` result.
    """
    print("inputs {}".format(X))
    probabilities = sess.run(load_infer_op, feed_dict={oX: X})
    as_strings = list(map(str, probabilities))
    print("return is {}".format(as_strings))
    return as_strings


# Smoke test: run one sample through the restored model locally.
print(predict([[5.9, 3.0, 5.1, 1.8]]))

Deploying with Clipper's Python closure deployer fails because the prediction closure cannot be pickled. This is a known issue when pickling Cython classes; see https://stackoverflow.com/questions/12646436/pickle-cython-class

In [None]:
from clipper_admin.deployers import python as python_deployer

# Deploy `predict` as a Python closure model. The function reads the
# module-level session and tensors, so they are part of the state that has to
# be serialised along with it.
python_deployer.deploy_python_closure(
    clipper_conn,
    name=MODEL_NAME,
    version=VERSION,
    input_type="doubles",
    func=predict,
    registry=REPO_URL,
    pkgs_to_install=['tensorflow'],
)

Deploying with Clipper's TensorFlow model deployer failed as well.

In [None]:
from clipper_admin.deployers.tensorflow import deploy_tensorflow_model


def predict_with_session(sess, inputs):
    """Prediction function in the ``func(sess, inputs)`` form.

    Clipper's TensorFlow deployer documents a prediction function that takes
    the session as its first argument. The tensors are addressed by name so
    the function does not close over the notebook's live session or tensor
    objects, which would otherwise have to be pickled together with it.

    Args:
        sess: Session supplied by the caller.
        inputs: Batch of feature rows to feed to the input placeholder.

    Returns:
        A list with one string per output row.
    """
    probabilities = sess.run('probabilities:0',
                             feed_dict={'Placeholder:0': inputs})
    return [str(row) for row in probabilities]


# NOTE(review): the graph uses tensor_forest ops from tf.contrib; the serving
# container presumably needs those ops available when it loads the saved
# session -- confirm against the container image.
deploy_tensorflow_model(clipper_conn,
                        name=MODEL_NAME,
                        version=VERSION,
                        input_type="doubles",
                        func=predict_with_session,
                        tf_sess_or_saved_model_path=sess,
                        registry=REPO_URL,
                        pkgs_to_install=['tensorflow'])

Link the model to the application

In [None]:
# Attach the deployed model to the registered application.
clipper_conn.link_model_to_app(
    app_name=APP_NAME,
    model_name=MODEL_NAME,
)

Test the deployed model by sending a query to the Clipper REST endpoint

In [None]:
import json

import numpy as np
import requests


# NOTE(review): this definition rebinds the name `predict`, which an earlier
# cell uses for the local model prediction function. Re-running the deploy
# cells after this one would pick up this REST helper instead. The name is
# kept so existing `predict()` calls keep working.
def predict(input_values=(5.9, 3.0, 5.1, 1.8), timeout=120):
    """Send one sample to the Clipper query endpoint and print the response.

    Args:
        input_values: Feature values for a single sample. Defaults to the
            sample used in the local smoke test.
        timeout: Seconds to wait for the HTTP response. The default is longer
            than the 100 second latency objective given when the application
            is registered, so the request does not hang forever if the proxy
            or the query frontend is unreachable.

    Raises:
        ValueError: If the response body is not valid JSON; the message
            includes the HTTP status code and the raw body.
        requests.exceptions.RequestException: On connection errors or timeout.
    """
    headers = {"Content-type": "application/json"}
    data = json.dumps({"input": list(input_values)})
    print(data)
    url = "http://{}/api/v1/namespaces/{}/services/query-frontend-at-default-cluster:1337/proxy/{}/predict".format(K8S_PROXY_ADDR, K8S_NAMESPACE, APP_NAME)
    res = requests.post(url, headers=headers, data=data, timeout=timeout)
    try:
        print(res.json())
    except ValueError:
        # A non-JSON body would otherwise surface only as a bare decode
        # error; include the status code and body so the cause is visible.
        raise ValueError("Non-JSON response (HTTP {}): {}".format(
            res.status_code, res.text))


predict()