# H2O AutoML

### [Documentation](https://docs.h2o.ai/h2o/latest-stable/h2o-docs/automl.html)

In [None]:
# Libraries
import pandas as pd
import h2o
from h2o.automl import H2OAutoML

In [None]:
# Bring up the H2O backend, allowing it at most 16 GB of memory
h2o_memory_limit = '16g'
h2o.init(max_mem_size=h2o_memory_limit)

In [None]:
# Load the competition CSVs through H2O: training data first, then test data
train, test = (
    h2o.import_file(csv_path)
    for csv_path in (
        '../input/tabular-playground-series-mar-2021/train.csv',
        '../input/tabular-playground-series-mar-2021/test.csv',
    )
)

In [None]:
# Features
# The response is the last column of the training frame. Every other column
# is a predictor, except 'id': it is only a row identifier (it serves as the
# index of the submission file), so feeding it to the models would add a
# meaningless feature they could overfit on.
target = train.columns[-1]
predictors = [col for col in train.columns if col not in ('id', target)]

In [None]:
# The response must be a factor (categorical) column for binary
# classification, so convert it before training
target_as_factor = train[target].asfactor()
train[target] = target_as_factor

In [None]:
# Configure the AutoML run, then fit it on the training frame
automl_settings = {
    'nfolds': 10,                      # number of cross-validation folds
    'sort_metric': 'auc',              # metric used to order the leaderboard
    'stopping_metric': 'auc',          # metric used for early stopping
    'max_runtime_secs': 8 * 3600,      # time budget: 8 hours
    'seed': 0,                         # fixed seed for repeatability
}
aml = H2OAutoML(**automl_settings)

aml.train(training_frame=train, x=predictors, y=target)

In [None]:
# Display the full AutoML leaderboard (all rows, not just the default head)
lb = aml.leaderboard
n_leaderboard_rows = lb.nrows
lb.head(rows=n_leaderboard_rows)

In [None]:
# Score the test frame with the leading model and pull out the 'p1' column
# (presumably the predicted probability of class 1 -- confirm against the
# prediction frame layout)
leader_model = aml.leader
output = leader_model.predict(test)
p1_column = output['p1']
predictions = h2o.as_list(p1_column)

In [None]:
# Build the submission: re-read the test CSV indexed by 'id', attach the
# predictions as the target column, and write only that column to disk
test_csv_path = '../input/tabular-playground-series-mar-2021/test.csv'
submission = pd.read_csv(test_csv_path, index_col='id')
submission[target] = predictions.values
target_column = submission[target]
target_column.to_csv('submission.csv')