# How to Develop a Bagging Ensemble with Python - Classification
Based on the Machine Learning Mastery tutorial [How to Develop a Bagging Ensemble with Python](https://machinelearningmastery.com/bagging-ensemble-with-python/).

In [1]:
from numpy import mean
from numpy import std
from sklearn.datasets import make_classification
from sklearn.model_selection import cross_val_score
from sklearn.model_selection import RepeatedStratifiedKFold
from sklearn.ensemble import BaggingClassifier

## Test classification dataset

In [2]:
# Build a synthetic classification problem (n_classes is left at its default of 2).
# The generator is seeded so the same data is produced on every run.
X, y = make_classification(
    n_samples=1000,
    n_features=20,
    n_informative=15,
    n_redundant=5,
    random_state=5,
)
# Show the shapes of the feature matrix and of the label vector.
print(X.shape, y.shape)

(1000, 20) (1000,)


## Evaluate bagging algorithm for classification
[Documentation about class `BaggingClassifier`](https://scikit-learn.org/stable/modules/generated/sklearn.ensemble.BaggingClassifier.html)

In [3]:
# define the model; a fixed random_state seeds the ensemble's random resampling
# so the scores (and the model fitted later on the whole dataset) are
# reproducible after a kernel restart.
# NOTE: previously recorded outputs came from an unseeded model; re-run to refresh them.
model = BaggingClassifier(random_state=1)
# evaluate the model: stratified 10-fold cross-validation repeated 3 times (30 scores)
cv = RepeatedStratifiedKFold(n_splits=10, n_repeats=3, random_state=1)
# error_score='raise' surfaces any fitting failure instead of recording a placeholder score
n_scores = cross_val_score(model, X, y, scoring='accuracy', cv=cv, n_jobs=-1, error_score='raise')
print("n_scores =", n_scores)
print("n_scores.length =", len(n_scores))
# report performance as mean accuracy with its standard deviation in parentheses
print('Accuracy: %.3f (%.3f)' % (mean(n_scores), std(n_scores)))

n_scores = [0.89 0.89 0.8  0.83 0.88 0.88 0.92 0.86 0.91 0.86 0.9  0.82 0.79 0.8
 0.84 0.88 0.89 0.89 0.92 0.87 0.9  0.88 0.79 0.88 0.84 0.82 0.87 0.9
 0.83 0.84]
n_scores.length = 30
Accuracy: 0.862 (0.038)


## Make predictions using bagging for classification

In [4]:
# Train the ensemble on every available sample (no hold-out split here).
model.fit(X, y)
# One hand-written observation with 20 feature values, wrapped in an outer
# list so it is passed to predict() as a single-row 2D input.
row = [[
    -4.7705504, -1.88685058, -0.96057964, 2.53850317, -6.5843005,
    3.45711663, -7.46225013, 2.01338213, -0.45086384, -1.89314931,
    -2.90675203, -0.21214568, -0.9623956, 3.93862591, 0.06276375,
    0.33964269, 4.0835676, 1.31423977, -2.17983117, 3.1047287,
]]
yhat = model.predict(row)
# predict() returns one label per input row; report the only one.
print('Predicted Class: %d' % yhat[0])

Predicted Class: 1
