# Chapter 2 - Automated Machine Learning On Azure

### Create a Compute Cluster to Run your AutoML Jobs

In [7]:
# Import libraries necessary to create a Compute Cluster

import azureml.core
from azureml.core.compute import ComputeTarget, AmlCompute
from azureml.core.compute_target import ComputeTargetException
from azureml.core.workspace import Workspace

In [8]:
# Load your Azure Machine Learning Workspace; every later cell reaches Azure through `ws`

ws = Workspace.from_config()

In [9]:
# Settings used when creating your Compute Cluster

# Name of your Compute Cluster
compute_name = 'automl-cluster'

# Minimum number of nodes the cluster scales down to at rest
compute_min_nodes = 0

# Maximum number of nodes the cluster scales up to while running your job
compute_max_nodes = 4

# Type of Virtual Machine each node of the cluster uses
vm_size = 'Standard_DS3_v2'

# Idle time, in seconds, before the cluster scales down to the minimum number of nodes
idle_seconds = 1200


In [12]:
# Build the provisioning configuration for the cluster from the variables set above:
# VM type, autoscale range (min/max nodes) and idle time before scaling down

Compute_Config = AmlCompute.provisioning_configuration(
    vm_size=vm_size,
    min_nodes=compute_min_nodes,
    max_nodes=compute_max_nodes,
    idle_seconds_before_scaledown=idle_seconds,
)

In [15]:
# Create your Compute Cluster, or reuse it if one with this name already exists.
# Looking the cluster up first keeps this cell safe to re-run (for example after a
# kernel restart) instead of submitting another provisioning request for the same name.
try:
    compute_target = ComputeTarget(workspace=ws, name=compute_name)
    print('Found existing Compute Cluster, using it.')
except ComputeTargetException:
    # No compute target with this name exists in the workspace yet, so provision one
    compute_target = ComputeTarget.create(ws, compute_name, Compute_Config)

# Block until the cluster is ready, showing progress in the cell output
compute_target.wait_for_completion(show_output=True)


Succeeded
AmlCompute wait for completion finished

Minimum number of nodes requested have been provisioned


### Create a Dataset to train an Automated Machine Learning Model

In [16]:
# Import libraries necessary to create a Dataset from the Azure Open Datasets Diabetes sample data

from azureml.opendatasets import Diabetes
from azureml.core import Dataset

In [17]:
# Fetch the Diabetes sample from Azure Open Datasets as a tabular dataset

diabetes_tabular = Diabetes.get_tabular_dataset()

In [18]:
# Connect to your Azure Machine Learning Workspace again.
# This repeats the import and connection from the Compute Cluster section,
# presumably so the Dataset section can be run on its own.

from azureml.core.workspace import Workspace

ws = Workspace.from_config()

In [20]:
# Register the Dataset in your AMLS Workspace under the name 'Diabetes Sample'
# NOTE(review): if a different dataset is already registered under this name, a re-run
# may need create_new_version=True — confirm against the SDK documentation
diabetes = diabetes_tabular.register(
    workspace=ws,
    name='Diabetes Sample',
)


In [23]:
# Preview the first five rows of your registered Dataset as a pandas DataFrame
diabetes.to_pandas_dataframe().head(n=5)

Unnamed: 0,AGE,SEX,BMI,BP,S1,S2,S3,S4,S5,S6,Y
0,59,2,32.1,101.0,157,93.2,38.0,4.0,4.8598,87,151
1,48,1,21.6,87.0,183,103.2,70.0,3.0,3.8918,69,75
2,72,2,30.5,93.0,156,93.6,41.0,4.0,4.6728,85,141
3,24,1,25.3,84.0,198,131.4,40.0,5.0,4.8903,89,206
4,50,1,23.0,101.0,192,125.4,52.0,4.0,4.2905,80,135
