From 481257f4dea19541aee5520154b94e8f86e292e5 Mon Sep 17 00:00:00 2001 From: Omer Spillinger Date: Sun, 1 Dec 2019 23:39:11 -0800 Subject: [PATCH] Update docs --- README.md | 21 ++- docs/cluster-management/install.md | 4 +- examples/sklearn/iris-classifier/README.md | 151 ++++++++++++++++-- .../iris-classifier/batch-predictor.py | 20 +++ examples/sklearn/iris-classifier/cortex.yaml | 13 +- examples/sklearn/iris-classifier/predictor.py | 20 ++- examples/sklearn/iris-classifier/sample.json | 2 +- examples/sklearn/iris-classifier/samples.json | 20 +++ 8 files changed, 210 insertions(+), 41 deletions(-) create mode 100644 examples/sklearn/iris-classifier/batch-predictor.py create mode 100644 examples/sklearn/iris-classifier/samples.json diff --git a/README.md b/README.md index 1691ae83b2..76dcaa6747 100644 --- a/README.md +++ b/README.md @@ -1,6 +1,6 @@ # Deploy machine learning models in production -Cortex is an open source platform for deploying machine learning models—trained with nearly any framework—as production web services. +Cortex is an open source platform for deploying machine learning models as production web services.
@@ -15,29 +15,34 @@ Cortex is an open source platform for deploying machine learning models—traine ## Key features -* **Autoscaling:** Cortex automatically scales APIs to handle production workloads. * **Multi framework:** Cortex supports TensorFlow, PyTorch, scikit-learn, XGBoost, and more. +* **Autoscaling:** Cortex automatically scales APIs to handle production workloads. * **CPU / GPU support:** Cortex can run inference on CPU or GPU infrastructure. * **Spot instances:** Cortex supports EC2 spot instances. * **Rolling updates:** Cortex updates deployed APIs without any downtime. * **Log streaming:** Cortex streams logs from deployed models to your CLI. * **Prediction monitoring:** Cortex monitors network metrics and tracks predictions. -* **Minimal configuration:** Deployments are defined in a single `cortex.yaml` file. +* **Minimal configuration:** deployments are defined in a single `cortex.yaml` file.
-## Spinning up a Cortex cluster +## Spinning up a cluster -Cortex is designed to be self-hosted on any AWS account. You can spin up a Cortex cluster with a single command: +Cortex is designed to be self-hosted on any AWS account. You can spin up a cluster with a single command: + ```bash +# install the CLI on your machine +$ bash -c "$(curl -sS https://raw.githubusercontent.com/cortexlabs/cortex/0.11/get-cli.sh)" + +# provision infrastructure on AWS and spin up a cluster $ cortex cluster up aws region: us-west-2 aws instance type: p2.xlarge +spot instances: yes min instances: 0 max instances: 10 -spot instances: yes ○ spinning up your cluster ... your cluster is ready! @@ -110,9 +115,9 @@ negative 4
-## What is Cortex an alternative to? +## What is Cortex similar to? -Cortex is an open source alternative to serving models with SageMaker or building your own model deployment platform on top of AWS services like Elastic Kubernetes Service (EKS), Elastic Container Service (ECS), Lambda, Fargate, and Elastic Compute Cloud (EC2) or open source projects like Docker, Kubernetes, and TensorFlow Serving. +Cortex is an open source alternative to serving models with SageMaker or building your own model deployment platform on top of AWS services like Elastic Kubernetes Service (EKS), Elastic Container Service (ECS), Lambda, Fargate, and Elastic Compute Cloud (EC2) and open source projects like Docker, Kubernetes, and TensorFlow Serving.
diff --git a/docs/cluster-management/install.md b/docs/cluster-management/install.md index 5b6efb455d..18eae07ef4 100644 --- a/docs/cluster-management/install.md +++ b/docs/cluster-management/install.md @@ -11,10 +11,10 @@ See [cluster configuration](config.md) to learn how you can customize your clust ```bash -# install the Cortex CLI on your machine +# install the CLI on your machine bash -c "$(curl -sS https://raw.githubusercontent.com/cortexlabs/cortex/master/get-cli.sh)" -# provision infrastructure on AWS and install Cortex +# provision infrastructure on AWS and spin up a cluster cortex cluster up ``` diff --git a/examples/sklearn/iris-classifier/README.md b/examples/sklearn/iris-classifier/README.md index 91151b7606..802b417235 100644 --- a/examples/sklearn/iris-classifier/README.md +++ b/examples/sklearn/iris-classifier/README.md @@ -58,11 +58,11 @@ $ python3 trainer.py # predictor.py import pickle -import numpy +import numpy as np model = None -labels = ["iris-setosa", "iris-versicolor", "iris-virginica"] +labels = ["setosa", "versicolor", "virginica"] def init(model_path, metadata): @@ -71,16 +71,14 @@ def init(model_path, metadata): def predict(sample, metadata): - input_array = numpy.array( - [ - sample["sepal_length"], - sample["sepal_width"], - sample["petal_length"], - sample["petal_width"], - ] - ) - - label_id = model.predict([input_array])[0] + measurements = [ + sample["sepal_length"], + sample["sepal_width"], + sample["petal_length"], + sample["petal_width"], + ] + + label_id = model.predict(np.array([measurements]))[0] return labels[label_id] ``` @@ -153,7 +151,7 @@ $ curl http://***.amazonaws.com/iris/classifier \ -X POST -H "Content-Type: application/json" \ -d '{"sepal_length": 5.2, "sepal_width": 3.6, "petal_length": 1.4, "petal_width": 0.3}' -"iris-setosa" +"setosa" ```
@@ -214,7 +212,7 @@ This model is fairly small but larger models may require more compute resources. tracker: model_type: classification compute: - cpu: 1 + cpu: 0.5 mem: 1G ``` @@ -257,7 +255,7 @@ If you trained another model and want to A/B test it with your previous model, s tracker: model_type: classification compute: - cpu: 1 + cpu: 0.5 mem: 1G - kind: api @@ -268,7 +266,7 @@ If you trained another model and want to A/B test it with your previous model, s tracker: model_type: classification compute: - cpu: 1 + cpu: 0.5 mem: 1G ``` @@ -286,8 +284,126 @@ creating another-classifier api $ cortex get --watch api status up-to-date available requested last update -another-classifier live 1 1 1 8s classifier live 1 1 1 5m +another-classifier live 1 1 1 8s +``` + +## Add a batch API + +First, implement `batch-predictor.py` with a `predict` function that can process an array of samples: + +```python +# batch-predictor.py + +import pickle +import numpy as np + + +model = None +labels = ["setosa", "versicolor", "virginica"] + + +def init(model_path, metadata): + global model + model = pickle.load(open(model_path, "rb")) + + +def predict(sample, metadata): + measurements = [ + [s["sepal_length"], s["sepal_width"], s["petal_length"], s["petal_width"]] for s in sample + ] + + label_ids = model.predict(np.array(measurements)) + return [labels[label_id] for label_id in label_ids] +``` + +Next, add the `api` to `cortex.yaml`: + +```yaml +- kind: deployment + name: iris + +- kind: api + name: classifier + predictor: + path: predictor.py + model: s3://cortex-examples/sklearn/iris-classifier/model.pkl + tracker: + model_type: classification + compute: + cpu: 0.5 + mem: 1G + +- kind: api + name: another-classifier + predictor: + path: predictor.py + model: s3://cortex-examples/sklearn/iris-classifier/another-model.pkl + tracker: + model_type: classification + compute: + cpu: 0.5 + mem: 1G + + +- kind: api + name: batch-classifier + predictor: + path: batch-predictor.py + model: 
s3://cortex-examples/sklearn/iris-classifier/model.pkl + compute: + cpu: 0.5 + mem: 1G +``` + +Run `cortex deploy` to create the batch API: + +```bash +$ cortex deploy + +creating batch-classifier api +``` + +`cortex get` should show all three APIs now: + +```bash +$ cortex get --watch + +api status up-to-date available requested last update +classifier live 1 1 1 10m +another-classifier live 1 1 1 5m +batch-classifier live 1 1 1 8s +``` + +
+
+## Try a batch prediction
+
+```bash
+$ curl http://***.amazonaws.com/iris/batch-classifier \
+    -X POST -H "Content-Type: application/json" \
+    -d '[
+  {
+    "sepal_length": 5.2,
+    "sepal_width": 3.6,
+    "petal_length": 1.5,
+    "petal_width": 0.3
+  },
+  {
+    "sepal_length": 7.1,
+    "sepal_width": 3.3,
+    "petal_length": 4.8,
+    "petal_width": 1.5
+  },
+  {
+    "sepal_length": 6.4,
+    "sepal_width": 3.4,
+    "petal_length": 6.1,
+    "petal_width": 2.6
+  }
+]'
+
+["setosa","versicolor","virginica"]
```
@@ -301,6 +417,7 @@ $ cortex delete deleting classifier api deleting another-classifier api +deleting batch-classifier api ``` Running `cortex delete` will free up cluster resources and allow Cortex to scale down to the minimum number of instances you specified during cluster installation. It will not spin down your cluster. diff --git a/examples/sklearn/iris-classifier/batch-predictor.py b/examples/sklearn/iris-classifier/batch-predictor.py new file mode 100644 index 0000000000..5eb818bc3c --- /dev/null +++ b/examples/sklearn/iris-classifier/batch-predictor.py @@ -0,0 +1,20 @@ +import pickle +import numpy as np + + +model = None +labels = ["setosa", "versicolor", "virginica"] + + +def init(model_path, metadata): + global model + model = pickle.load(open(model_path, "rb")) + + +def predict(sample, metadata): + measurements = [ + [s["sepal_length"], s["sepal_width"], s["petal_length"], s["petal_width"]] for s in sample + ] + + label_ids = model.predict(np.array(measurements)) + return [labels[label_id] for label_id in label_ids] diff --git a/examples/sklearn/iris-classifier/cortex.yaml b/examples/sklearn/iris-classifier/cortex.yaml index ad18a402aa..da78546b70 100644 --- a/examples/sklearn/iris-classifier/cortex.yaml +++ b/examples/sklearn/iris-classifier/cortex.yaml @@ -9,7 +9,7 @@ tracker: model_type: classification compute: - cpu: 1 + cpu: 0.5 mem: 1G - kind: api @@ -20,5 +20,14 @@ tracker: model_type: classification compute: - cpu: 1 + cpu: 0.5 + mem: 1G + +- kind: api + name: batch-classifier + predictor: + path: batch-predictor.py + model: s3://cortex-examples/sklearn/iris-classifier/model.pkl + compute: + cpu: 0.5 mem: 1G diff --git a/examples/sklearn/iris-classifier/predictor.py b/examples/sklearn/iris-classifier/predictor.py index e3c387e4bf..d8fbad9843 100644 --- a/examples/sklearn/iris-classifier/predictor.py +++ b/examples/sklearn/iris-classifier/predictor.py @@ -1,9 +1,9 @@ import pickle -import numpy +import numpy as np model = None -labels = 
["iris-setosa", "iris-versicolor", "iris-virginica"] +labels = ["setosa", "versicolor", "virginica"] def init(model_path, metadata): @@ -12,14 +12,12 @@ def init(model_path, metadata): def predict(sample, metadata): - input_array = numpy.array( - [ - sample["sepal_length"], - sample["sepal_width"], - sample["petal_length"], - sample["petal_width"], - ] - ) + measurements = [ + sample["sepal_length"], + sample["sepal_width"], + sample["petal_length"], + sample["petal_width"], + ] - label_id = model.predict([input_array])[0] + label_id = model.predict(np.array([measurements]))[0] return labels[label_id] diff --git a/examples/sklearn/iris-classifier/sample.json b/examples/sklearn/iris-classifier/sample.json index 252c666b3a..9e792863cd 100644 --- a/examples/sklearn/iris-classifier/sample.json +++ b/examples/sklearn/iris-classifier/sample.json @@ -1,6 +1,6 @@ { "sepal_length": 5.2, "sepal_width": 3.6, - "petal_length": 1.4, + "petal_length": 1.5, "petal_width": 0.3 } diff --git a/examples/sklearn/iris-classifier/samples.json b/examples/sklearn/iris-classifier/samples.json new file mode 100644 index 0000000000..2de60e1dc0 --- /dev/null +++ b/examples/sklearn/iris-classifier/samples.json @@ -0,0 +1,20 @@ +[ + { + "sepal_length": 5.2, + "sepal_width": 3.6, + "petal_length": 1.5, + "petal_width": 0.3 + }, + { + "sepal_length": 7.1, + "sepal_width": 3.3, + "petal_length": 4.8, + "petal_width": 1.5 + }, + { + "sepal_length": 6.4, + "sepal_width": 3.4, + "petal_length": 6.1, + "petal_width": 2.6 + } +]