In [1]:
from flaml import AutoML
from flaml.data import load_openml_dataset

# Load the OpenML "houses" dataset (https://www.openml.org/d/537), using the
# current directory as `data_dir`. The task is to predict the median house price
# of a region from its demographic composition and the state of its housing market.
X_train, X_test, y_train, y_test = load_openml_dataset(
    dataset_id=537,
    data_dir='./',
)

# Keyword arguments forwarded verbatim to `AutoML.fit` below.
settings = dict(
    time_budget=60,  # total running time, in seconds
    metric='r2',  # primary regression metric; one of 'mae', 'mse', 'r2'
    estimator_list=['lgbm'],  # ML learners to search over; only lightgbm is tuned here
    task='regression',  # task type
    log_file_name='houses_experiment.log',  # FLAML log file
    seed=7654321,  # random seed
)

# Create the searcher and run it on the training split.
automl = AutoML()
automl.fit(X_train=X_train, y_train=y_train, **settings)

download dataset from openml


[flaml.automl: 04-23 11:06:22] {2105} INFO - task = regression
[flaml.automl: 04-23 11:06:22] {2107} INFO - Data split method: uniform
[flaml.automl: 04-23 11:06:22] {2111} INFO - Evaluation method: cv
[flaml.automl: 04-23 11:06:22] {2188} INFO - Minimizing error metric: 1-r2
[flaml.automl: 04-23 11:06:22] {2281} INFO - List of ML learners in AutoML Run: ['lgbm']
[flaml.automl: 04-23 11:06:22] {2567} INFO - iteration 0, current learner lgbm
[flaml.automl: 04-23 11:06:22] {2697} INFO - Estimated sufficient time budget=919s. Estimated necessary time budget=1s.
[flaml.automl: 04-23 11:06:22] {2744} INFO -  at 0.1s,	estimator lgbm's best error=0.7383,	best estimator lgbm's best error=0.7383
[flaml.automl: 04-23 11:06:22] {2567} INFO - iteration 1, current learner lgbm


Dataset name: houses
X_train.shape: (15480, 8), y_train.shape: (15480,);
X_test.shape: (5160, 8), y_test.shape: (5160,)


[flaml.automl: 04-23 11:06:22] {2744} INFO -  at 0.2s,	estimator lgbm's best error=0.7383,	best estimator lgbm's best error=0.7383
[flaml.automl: 04-23 11:06:22] {2567} INFO - iteration 2, current learner lgbm
[flaml.automl: 04-23 11:06:23] {2744} INFO -  at 0.3s,	estimator lgbm's best error=0.3250,	best estimator lgbm's best error=0.3250
[flaml.automl: 04-23 11:06:23] {2567} INFO - iteration 3, current learner lgbm
[flaml.automl: 04-23 11:06:23] {2744} INFO -  at 0.5s,	estimator lgbm's best error=0.1868,	best estimator lgbm's best error=0.1868
[flaml.automl: 04-23 11:06:23] {2567} INFO - iteration 4, current learner lgbm
[flaml.automl: 04-23 11:06:24] {2744} INFO -  at 1.3s,	estimator lgbm's best error=0.1868,	best estimator lgbm's best error=0.1868
[flaml.automl: 04-23 11:06:24] {2567} INFO - iteration 5, current learner lgbm
[flaml.automl: 04-23 11:06:24] {2744} INFO -  at 1.4s,	estimator lgbm's best error=0.1868,	best estimator lgbm's best error=0.1868
[flaml.automl: 04-23 11:06:24