In [1]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

In [2]:
from sklearn.model_selection import train_test_split
from sklearn.ensemble import StackingClassifier
from sklearn.tree import DecisionTreeClassifier
from sklearn.linear_model import LogisticRegression
from sklearn.svm import SVC
from sklearn.metrics import accuracy_score,classification_report
from sklearn.preprocessing import LabelEncoder


In [3]:
# Load seaborn's "iris" example dataset and preview the first five rows.
df = sns.load_dataset(name="iris")
df.head(n=5)

Unnamed: 0,sepal_length,sepal_width,petal_length,petal_width,species
0,5.1,3.5,1.4,0.2,setosa
1,4.9,3.0,1.4,0.2,setosa
2,4.7,3.2,1.3,0.2,setosa
3,4.6,3.1,1.5,0.2,setosa
4,5.0,3.6,1.4,0.2,setosa


In [4]:
# Target: the species label. Features: every remaining column.
y = df['species']
X = df.drop(columns=['species'])

In [5]:
# Learn the species -> integer code mapping, then apply it to the full target.
le = LabelEncoder().fit(y)
y_encoded = le.transform(y)

In [6]:
# Hold out 20% of the rows for testing. The targets keep their original species
# labels (y), while the encoded labels are only used to stratify the split so
# both partitions keep the same class proportions.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=42,
    stratify=y_encoded,
)

In [7]:
# First-level models of the stack, given as (name, estimator) pairs.
base_learners = [
    # Single decision tree, seeded for repeatable fits.
    ('dt', DecisionTreeClassifier(random_state=42)),
    # RBF-kernel SVM with probability estimates enabled.
    ('svc', SVC(kernel='rbf', probability=True, random_state=42)),
    # Logistic regression with a raised iteration cap.
    ('lr', LogisticRegression(max_iter=1000)),
]

In [8]:
# Second-level model: combines the base learners' outputs into the final prediction.
meta_learner = LogisticRegression(
    max_iter=1000,
)

In [9]:
# Assemble the stack: base learners feed the meta learner, with 5-fold
# cross-validation (cv=5) used when fitting.
stacking_clf = StackingClassifier(cv=5, final_estimator=meta_learner, estimators=base_learners)

In [10]:
# Train the stacked ensemble on the training split (the fitted estimator is displayed).
stacking_clf.fit(X=X_train, y=y_train)

0,1,2
,estimators,"[('dt', ...), ('svc', ...), ...]"
,final_estimator,LogisticRegre...max_iter=1000)
,cv,5
,stack_method,'auto'
,n_jobs,
,passthrough,False
,verbose,0

0,1,2
,criterion,'gini'
,splitter,'best'
,max_depth,
,min_samples_split,2
,min_samples_leaf,1
,min_weight_fraction_leaf,0.0
,max_features,
,random_state,42
,max_leaf_nodes,
,min_impurity_decrease,0.0

0,1,2
,C,1.0
,kernel,'rbf'
,degree,3
,gamma,'scale'
,coef0,0.0
,shrinking,True
,probability,True
,tol,0.001
,cache_size,200
,class_weight,

0,1,2
,penalty,'l2'
,dual,False
,tol,0.0001
,C,1.0
,fit_intercept,True
,intercept_scaling,1
,class_weight,
,random_state,
,solver,'lbfgs'
,max_iter,1000

0,1,2
,penalty,'l2'
,dual,False
,tol,0.0001
,C,1.0
,fit_intercept,True
,intercept_scaling,1
,class_weight,
,random_state,
,solver,'lbfgs'
,max_iter,1000


In [11]:
# Predict species labels for the held-out rows with the stacked ensemble.
y_pred = stacking_clf.predict(X=X_test)

In [12]:
# Share of held-out rows whose predicted label matches the true label.
accuracy = accuracy_score(y_true=y_test, y_pred=y_pred)

In [13]:
# Display the test-set accuracy currently stored in `accuracy`.
accuracy

0.9666666666666667

In [14]:
# Random forest

In [15]:
from sklearn.ensemble import RandomForestClassifier

In [16]:
# Random forest configuration:
#   n_estimators=100 -> number of trees in the forest
#   max_depth=None   -> no depth limit, so trees are allowed to grow fully
#   random_state=42  -> fixed seed for repeatable fits
rf_model = RandomForestClassifier(n_estimators=100, max_depth=None, random_state=42)

In [17]:
# Train the random forest on the training split (the fitted estimator is displayed).
rf_model.fit(X=X_train, y=y_train)

0,1,2
,n_estimators,100
,criterion,'gini'
,max_depth,
,min_samples_split,2
,min_samples_leaf,1
,min_weight_fraction_leaf,0.0
,max_features,'sqrt'
,max_leaf_nodes,
,min_impurity_decrease,0.0
,bootstrap,True


In [18]:
# Predict the held-out rows with the random forest.
# Note: this rebinds y_pred, replacing the previous model's predictions.
y_pred = rf_model.predict(X=X_test)

In [19]:
# Random forest accuracy on the held-out rows; the bare name displays the value.
accuracy = accuracy_score(y_true=y_test, y_pred=y_pred)
accuracy

0.9

In [20]:
# AdaBoost, gradient boosting, XGBoost

In [21]:
from sklearn.ensemble import AdaBoostClassifier, GradientBoostingClassifier

In [22]:
%pip install xgboost

Note: you may need to restart the kernel to use updated packages.



[notice] A new release of pip is available: 25.2 -> 25.3
[notice] To update, run: python.exe -m pip install --upgrade pip


In [23]:
import xgboost as xgb

In [24]:
from xgboost import XGBClassifier

In [25]:
# AdaBoost ensemble of up to 100 boosting rounds, seeded for repeatable fits.
ada_model = AdaBoostClassifier(
    n_estimators=100,
    random_state=42,
)

In [26]:
# Train AdaBoost on the training split (the fitted estimator is displayed).
ada_model.fit(X=X_train, y=y_train)

0,1,2
,estimator,
,n_estimators,100
,learning_rate,1.0
,algorithm,'deprecated'
,random_state,42


In [27]:
# Predict the held-out rows with AdaBoost (rebinds y_pred).
y_pred = ada_model.predict(X=X_test)

In [28]:
# AdaBoost accuracy on the held-out rows; the bare name displays the value.
accuracy = accuracy_score(y_true=y_test, y_pred=y_pred)
accuracy

0.9333333333333333

In [29]:
# Gradient boosting: 100 boosting stages with a 0.1 learning rate, seeded for
# repeatable fits.
gb_model = GradientBoostingClassifier(
    n_estimators=100,
    learning_rate=0.1,
    random_state=42,
)

In [30]:
# Train gradient boosting on the training split (the fitted estimator is displayed).
gb_model.fit(X=X_train, y=y_train)

0,1,2
,loss,'log_loss'
,learning_rate,0.1
,n_estimators,100
,subsample,1.0
,criterion,'friedman_mse'
,min_samples_split,2
,min_samples_leaf,1
,min_weight_fraction_leaf,0.0
,max_depth,3
,min_impurity_decrease,0.0


In [31]:
# Predict the held-out rows with gradient boosting (rebinds y_pred).
y_pred = gb_model.predict(X=X_test)

In [32]:
# Gradient boosting accuracy on the held-out rows; the bare name displays the value.
accuracy = accuracy_score(y_true=y_test, y_pred=y_pred)
accuracy

0.9666666666666667

In [33]:
# Encode labels
le = LabelEncoder()
y_train_enc = le.fit_transform(y_train)
y_test_enc = le.transform(y_test)

# Model
xgb_model = XGBClassifier(
    n_estimators=100,
    learning_rate=0.1,
    max_depth=3,
    eval_metric='mlogloss',
    random_state=42
)

# Train
xgb_model.fit(X_train, y_train_enc)

# Predict
y_pred = xgb_model.predict(X_test)

# Accuracy
accuracy = accuracy_score(y_test_enc, y_pred)
print("Accuracy:", accuracy)

Accuracy: 0.9333333333333333
