#### Dataset Preparation

In [27]:
import numpy as np


# Seed NumPy's global random number generator with a fixed value (42).
# NOTE(review): presumably meant to make the scikit-learn steps below repeatable;
# confirm this also holds for fits executed in the n_jobs=-1 worker processes.
np.random.seed(42)
import pandas as pd
from sklearn.datasets import load_wine
from sklearn.model_selection import GridSearchCV
from sklearn.model_selection import train_test_split
from sklearn.tree import DecisionTreeClassifier

In [28]:
# Load the wine data bunch, then unpack the feature matrix and the class labels.
dataset = load_wine()
x, y = dataset.data, dataset.target

#### CART Classifier

In [29]:
# Hold out 30% of the samples for the final evaluation. random_state is pinned so
# that re-running this cell always yields the same split, independent of how much
# of the global NumPy random stream has already been consumed by earlier cells.
x_train, x_test, y_train, y_test = train_test_split(
    x, y, test_size=0.3, random_state=42
)

In [30]:
# Hyper-parameter grid for the decision tree.
# min_samples_split must be an integer >= 2 (or a float fraction); a value of 1 is
# rejected by scikit-learn, so every candidate using it would fail to fit instead
# of being evaluated. The grid therefore starts at 2.
parameters = {
    "criterion": ["gini", "entropy"],
    "max_depth": [None, 2, 4, 8, 10],
    "min_samples_split": [2, 4],
    "min_samples_leaf": [1, 2],
    "max_features": ["sqrt", "log2"],
}

# A fixed random_state keeps the random feature sub-sampling triggered by
# max_features repeatable, including inside the parallel workers started by
# n_jobs=-1, which are not guaranteed to share the global NumPy seed.
clf = DecisionTreeClassifier(random_state=42)
# Exhaustive search with 10-fold cross-validation, fitted on the training split only.
grid_cv = GridSearchCV(clf, parameters, cv=10, n_jobs=-1)
_ = grid_cv.fit(x_train, y_train)

In [31]:
# Report the winning hyper-parameter combination and its cross-validation score.
print(
    f"Parameters of best model: {grid_cv.best_params_}",
    f"Score of best model: {grid_cv.best_score_}",
    sep="\n",
)

Parameters of best model: {'criterion': 'gini', 'max_depth': 8, 'max_features': 'sqrt', 'min_samples_leaf': 2, 'min_samples_split': 2}
Score of best model: 0.9666666666666666


#### Train Best Model

In [32]:
# Re-train a tree with the winning hyper-parameters on the full training split.
# random_state is pinned because max_features makes tree construction stochastic;
# without it, re-running this cell could report a different accuracy each time.
# set_params returns the estimator itself, so the best parameters are applied on
# top of the seeded instance.
clf = DecisionTreeClassifier(random_state=42).set_params(**grid_cv.best_params_)
clf.fit(x_train, y_train)
# Accuracy on the held-out test split, which was not passed to the grid search.
score = clf.score(x_test, y_test)

print(f"Accuracy: {score}")

Accuracy: 0.8703703703703703
