# 1. Stacking

In [1]:
from sklearn.model_selection import train_test_split
from sklearn.ensemble import StackingClassifier
from sklearn.tree import DecisionTreeClassifier
from sklearn.linear_model import LogisticRegression
from sklearn.svm import SVC
from sklearn.metrics import accuracy_score, classification_report
import seaborn as sns

In [2]:
data = sns.load_dataset("iris")

In [3]:
data.head()

Unnamed: 0,sepal_length,sepal_width,petal_length,petal_width,species
0,5.1,3.5,1.4,0.2,setosa
1,4.9,3.0,1.4,0.2,setosa
2,4.7,3.2,1.3,0.2,setosa
3,4.6,3.1,1.5,0.2,setosa
4,5.0,3.6,1.4,0.2,setosa


In [4]:
X = data.drop(columns = ["species"], axis = 1)
y = data["species"]

In [6]:
from sklearn.preprocessing import LabelEncoder
encoder = LabelEncoder()
y_encoded = encoder.fit_transform(y)

In [7]:
X_train, X_test, y_train, y_test = train_test_split(X, y_encoded, test_size = 0.3, stratify = y_encoded, random_state = 42)

In [14]:
base_models = [
    ("dt", DecisionTreeClassifier(random_state = 42)),
    ("svc", SVC(probability = True, kernel = "rbf", random_state = 42)),
    ("lr", LogisticRegression(max_iter = 100))
]

In [15]:
meta_model = LogisticRegression(max_iter = 100)

In [16]:
stacking_clf = StackingClassifier(
    estimators = base_models,
    final_estimator = meta_model,
    cv = 5
)

In [17]:
stacking_clf.fit(X_train, y_train)

STOP: TOTAL NO. OF ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression
  n_iter_i = _check_optimize_result(


In [18]:
y_pred = stacking_clf.predict(X_test)

In [19]:
accuracy_score(y_test, y_pred)

0.9555555555555556

# 2. Bagging

In [20]:
from sklearn.ensemble import RandomForestClassifier

In [22]:
rf_model = RandomForestClassifier(
    n_estimators = 100,
    max_depth = None,
    random_state = 42
)

In [23]:
rf_model.fit(X_train, y_train)

In [24]:
rf_model_pred = rf_model.predict(X_test)

In [25]:
accuracy_score(y_test, rf_model_pred)

0.8888888888888888

# 3. Boosting

In [27]:
from sklearn.ensemble import AdaBoostClassifier
from sklearn.ensemble import GradientBoostingClassifier
from xgboost import XGBClassifier

In [29]:
ada_model = AdaBoostClassifier(
    n_estimators = 100,
    random_state = 42
)

In [31]:
ada_model.fit(X_train, y_train)
ada_model_pred = ada_model.predict(X_test)

In [32]:
accuracy_score(y_test, ada_model_pred)

0.9333333333333333

In [33]:
grad_model = GradientBoostingClassifier(
    n_estimators = 100,
    random_state = 42
)

In [34]:
grad_model.fit(X_train, y_train)
grad_model_pred = grad_model.predict(X_test)

In [35]:
accuracy_score(y_test, grad_model_pred)

0.9333333333333333

In [37]:
xgb_model = XGBClassifier(
    n_estimators = 100,
    learning_rate = 0.1,
    max_depth = 3,
    use_label_encoder = False,
    eval_metrics = "mlogloss",
    random_state = 42
)

In [39]:
xgb_model.fit(X_train, y_train)
xgb_model_pred = xgb_model.predict(X_test)

In [40]:
accuracy_score(y_test, xgb_model_pred)

0.9333333333333333