In [None]:
# Connect to BigML. BigML() is called without arguments here, so the
# connection needs the environment variables BIGML_USERNAME and BIGML_API_KEY
# to be set before this cell runs.
from bigml.api import BigML
api = BigML()

In [None]:
# Create a BigML source from a remote CSV file.
# The project id below should be changed to the one in your account.
PROJECT_ID = "project/5f91a1b40d052e40ea004b26"
source = api.create_source("https://static.bigml.com/csv/diabetes.csv",
                           {"project": PROJECT_ID})
# api.ok() waits for the resource and reports success through its return
# value; stop here on failure so later cells do not run against a bad source.
if not api.ok(source):
    raise RuntimeError("BigML source was not created successfully; "
                       "check that PROJECT_ID exists in your account")

In [None]:
# Create a dataset from the source.
dataset = api.create_dataset(source)
# api.ok() returns a falsy value when the resource did not finish correctly;
# fail now rather than reading fields from an unfinished dataset.
if not api.ok(dataset):
    raise RuntimeError("BigML dataset was not created successfully")
# Keep the dataset name: the train/test dataset cells build their names on it.
dataset_name = dataset["object"]["name"]
print(dataset_name)

In [None]:
# Create the training dataset as a seeded 0.8-rate sample of the full dataset.
# The test dataset cell reuses the same sample_rate and seed, so keep the two
# cells in sync if either value is changed.
train_dataset = api.create_dataset(dataset,
                                   {"name": "%s - Train" % dataset_name,
                                    "sample_rate": 0.8,
                                    "seed": "bigml"})
# Do not continue to modelling if the sample could not be built.
if not api.ok(train_dataset):
    raise RuntimeError("BigML training dataset was not created successfully")

In [None]:
# Create a model from the training data, predicting the "diabetes" field.
model = api.create_model(train_dataset,
                         {"objective_field": "diabetes"})
# The evaluation and local-prediction cells need a finished model, so stop
# here if api.ok() reports that it did not complete.
if not api.ok(model):
    raise RuntimeError("BigML model was not created successfully")

In [None]:
# Create the test dataset.
# It uses the same sample_rate and seed as the training dataset plus
# out_of_bag=True, which asks BigML for the rows left out of that sample, so
# the test rows do not overlap the training rows.
test_dataset = api.create_dataset(dataset,
                                  {"name": "%s - Test" % dataset_name,
                                   "sample_rate": 0.8,
                                   "seed": "bigml",
                                   "out_of_bag": True})
# Do not evaluate against a dataset that failed to build.
if not api.ok(test_dataset):
    raise RuntimeError("BigML test dataset was not created successfully")

In [None]:
# Create an evaluation of the model against the test dataset.
evaluation = api.create_evaluation(model, test_dataset)
# The metrics are read from the finished evaluation in the next cell, so stop
# here if api.ok() reports that the evaluation did not complete.
if not api.ok(evaluation):
    raise RuntimeError("BigML evaluation was not created successfully")

In [None]:
# Show the headline metrics stored under the evaluation's model results.
model_metrics = evaluation["object"]["result"]["model"]
print("accuracy: %s" % model_metrics["accuracy"])
print("precision: %s" % model_metrics["average_precision"])
print("recall: %s" % model_metrics["average_recall"])

### LOCAL PREDICTIONS

In [None]:
from bigml.model import Model

# Wrap the remote model resource in a local Model object.
local_model = Model(model)

# Input fields are keyed by field name, as in the dataset.
input_data = {
    "plasma glucose": 130,
    "bmi": "34",
}

# Last expression of the cell, so the prediction is shown as the cell output.
local_model.predict(input_data)

In [None]:
from pprint import pprint

# Pretty-print the root node stored in the model resource.
root_node = model["object"]["model"]["root"]
pprint(root_node)