In [7]:
import pandas as pd
import numpy as np
import seaborn as sns
import matplotlib.pyplot as plt
import sys
sys.path.append('..')
from utils_cd import (
        split_dataset,
        standard_deviation,
        plot_comparison_results,
        impute_values,
        plot_results,
        plot_param_improv,
        plot_results_from_csv,
        aps_classifier_statistics
)
from sklearn.neighbors import KNeighborsClassifier
from sklearn.tree import DecisionTreeClassifier
from sklearn.ensemble import RandomForestClassifier
from sklearn.naive_bayes import GaussianNB, MultinomialNB, BernoulliNB
from sklearn.decomposition import PCA
from sklearn.feature_selection import SelectKBest
from sklearn.feature_selection import chi2
from sklearn.preprocessing import Normalizer, StandardScaler
from imblearn.over_sampling import SMOTE
from imblearn.under_sampling import RandomUnderSampler
from sklearn.decomposition import PCA

pd.options.display.max_columns = None
sns.set(style='darkgrid')

CLASS = 'class'
train = pd.read_csv('./aps_failure_training_set.csv',
                        skiprows=20,keep_default_na=False, na_values='na')
test = pd.read_csv('./aps_failure_test_set.csv',
                        skiprows=20,keep_default_na=False, na_values='na')

X_train, y_train = split_dataset(train, CLASS)
X_test, y_test = split_dataset(test, CLASS)
y_train = y_train.map({'pos': 1, 'neg': 0})
y_test = y_test.map({'pos': 1, 'neg': 0})

X_train, X_test = X_train.reset_index(drop=True), X_test.reset_index(drop=True)

def normalize(X_train, X_test):
    normalizer = Normalizer().fit(X_train)

    X_train_norm = normalizer.transform(X_train)
    X_test_norm = normalizer.transform(X_test)
    
    return X_train_norm, X_test_norm

aps = pd.concat([X_train, X_test])

clf = DecisionTreeClassifier(random_state=42)
min_samples = np.concatenate([np.arange(5, 51, 5), np.arange(100, 1001, 100)])
results = {}
res_i = 0

In [3]:
min_samples

array([   5,   10,   15,   20,   25,   30,   35,   40,   45,   50,  100,
        200,  300,  400,  500,  600,  700,  800,  900, 1000])

In [8]:
X_train, X_test = X_train.fillna(X_train.median()), X_test.fillna(X_train.median())

In [52]:
res = aps_classifier_statistics(clf, X_train, X_test, y_train, y_test)
results[res_i] = {'Price': res['score'], 'Transformation': 'Baseline'}
res_i += 1
print(res)

{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.9889375, 'confusion_matrix': array([[15561,    64],
       [  113,   262]]), 'sensibility': 0.6986666666666667, 'specificity': 0.995904, 'score': 57140}


In [9]:
balancers = [(RandomUnderSampler(random_state=42), 'Undersample 50-50'), (RandomUnderSampler(ratio=0.3, random_state=42), 'Undersample 70-30'), (SMOTE(ratio=1.0, random_state=42), 'SMOTE 50-50'), (SMOTE(ratio=0.3, random_state=42), 'SMOTE 70-30')]
filename = 'dt_balancing'
measures = {}
i = 0

for samples in min_samples:
    for balancer, name in balancers:
        X_train_bal, y_train_bal = balancer.fit_sample(X_train, y_train)
        res = aps_classifier_statistics(DecisionTreeClassifier(min_samples_split=samples), X_train_bal, X_test, y_train_bal, y_test)
        print(res)

        measures[i] = {'Price': res['score'], 'Technique': name, 'Min Samples to Split': samples, 'Leafs': res['clf'].tree_.node_count}
        i += 1



{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.933125, 'confusion_matrix': array([[14575,  1050],
       [   20,   355]]), 'sensibility': 0.9466666666666667, 'specificity': 0.9328, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=5,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 20500}




{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.96425, 'confusion_matrix': array([[15096,   529],
       [   43,   332]]), 'sensibility': 0.8853333333333333, 'specificity': 0.966144, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=5,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 26790}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.9844375, 'confusion_matrix': array([[15483,   142],
       [  107,   268]]), 'sensibility': 0.7146666666666667, 'specificity': 0.990912, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=5,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 54920}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.9865625, 'confusion_matrix': array([[15506,   119],
       [   96,   279]]), 'sensibility': 0.744, 'specificity': 0.992384, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=5,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 49190}
{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.93025, 'confusion_matrix': array([[14533,  1092],
       [   24,   351]]), 'sensibility': 0.936, 'specificity': 0.930112, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=10,
       



{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.963875, 'confusion_matrix': array([[15088,   537],
       [   41,   334]]), 'sensibility': 0.8906666666666667, 'specificity': 0.965632, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=10,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 25870}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.985375, 'confusion_matrix': array([[15486,   139],
       [   95,   280]]), 'sensibility': 0.7466666666666667, 'specificity': 0.991104, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=10,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 48890}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.98675, 'confusion_matrix': array([[15499,   126],
       [   86,   289]]), 'sensibility': 0.7706666666666667, 'specificity': 0.991936, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=10,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 44260}
{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.9355, 'confusion_matrix': array([[14621,  1004],
       [   28,   347]]), 'sensibility': 0.9253333333333333, 'specificity': 0.935744, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_s



{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.965375, 'confusion_matrix': array([[15118,   507],
       [   47,   328]]), 'sensibility': 0.8746666666666667, 'specificity': 0.967552, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=15,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 28570}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.98425, 'confusion_matrix': array([[15477,   148],
       [  104,   271]]), 'sensibility': 0.7226666666666667, 'specificity': 0.990528, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=15,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 53480}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.987, 'confusion_matrix': array([[15507,   118],
       [   90,   285]]), 'sensibility': 0.76, 'specificity': 0.992448, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=15,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 46180}
{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.9400625, 'confusion_matrix': array([[14694,   931],
       [   28,   347]]), 'sensibility': 0.9253333333333333, 'specificity': 0.940416, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=



{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.9655, 'confusion_matrix': array([[15116,   509],
       [   43,   332]]), 'sensibility': 0.8853333333333333, 'specificity': 0.967424, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=20,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 26590}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.984, 'confusion_matrix': array([[15476,   149],
       [  107,   268]]), 'sensibility': 0.7146666666666667, 'specificity': 0.990464, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=20,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 54990}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.98725, 'confusion_matrix': array([[15506,   119],
       [   85,   290]]), 'sensibility': 0.7733333333333333, 'specificity': 0.992384, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=20,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 43690}
{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.943375, 'confusion_matrix': array([[14748,   877],
       [   29,   346]]), 'sensibility': 0.9226666666666666, 'specificity': 0.943872, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min



{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.9640625, 'confusion_matrix': array([[15092,   533],
       [   42,   333]]), 'sensibility': 0.888, 'specificity': 0.965888, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=25,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 26330}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.982625, 'confusion_matrix': array([[15454,   171],
       [  107,   268]]), 'sensibility': 0.7146666666666667, 'specificity': 0.989056, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=25,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 55210}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.9868125, 'confusion_matrix': array([[15503,   122],
       [   89,   286]]), 'sensibility': 0.7626666666666667, 'specificity': 0.992192, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=25,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 45720}
{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.9400625, 'confusion_matrix': array([[14696,   929],
       [   30,   345]]), 'sensibility': 0.92, 'specificity': 0.940544, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_sp



{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.9635, 'confusion_matrix': array([[15086,   539],
       [   45,   330]]), 'sensibility': 0.88, 'specificity': 0.965504, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=30,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 27890}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.9833125, 'confusion_matrix': array([[15459,   166],
       [  101,   274]]), 'sensibility': 0.7306666666666667, 'specificity': 0.989376, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=30,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 52160}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.9869375, 'confusion_matrix': array([[15501,   124],
       [   85,   290]]), 'sensibility': 0.7733333333333333, 'specificity': 0.992064, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=30,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 43740}
{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.9453125, 'confusion_matrix': array([[14782,   843],
       [   32,   343]]), 'sensibility': 0.9146666666666666, 'specificity': 0.946048, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, 



{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.9664375, 'confusion_matrix': array([[15138,   487],
       [   50,   325]]), 'sensibility': 0.8666666666666667, 'specificity': 0.968832, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=35,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 29870}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.9821875, 'confusion_matrix': array([[15449,   176],
       [  109,   266]]), 'sensibility': 0.7093333333333334, 'specificity': 0.988736, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=35,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 56260}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.9859375, 'confusion_matrix': array([[15486,   139],
       [   86,   289]]), 'sensibility': 0.7706666666666667, 'specificity': 0.991104, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=35,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 44390}
{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.9365, 'confusion_matrix': array([[14635,   990],
       [   26,   349]]), 'sensibility': 0.9306666666666666, 'specificity': 0.93664, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_



{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.9728125, 'confusion_matrix': array([[15241,   384],
       [   51,   324]]), 'sensibility': 0.864, 'specificity': 0.975424, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=40,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 29340}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.98275, 'confusion_matrix': array([[15450,   175],
       [  101,   274]]), 'sensibility': 0.7306666666666667, 'specificity': 0.9888, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=40,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 52250}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.985375, 'confusion_matrix': array([[15478,   147],
       [   87,   288]]), 'sensibility': 0.768, 'specificity': 0.990592, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=40,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 44970}
{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.9355, 'confusion_matrix': array([[14618,  1007],
       [   25,   350]]), 'sensibility': 0.9333333333333333, 'specificity': 0.935552, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split



{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.973625, 'confusion_matrix': array([[15255,   370],
       [   52,   323]]), 'sensibility': 0.8613333333333333, 'specificity': 0.97632, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=45,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 29700}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.9825, 'confusion_matrix': array([[15446,   179],
       [  101,   274]]), 'sensibility': 0.7306666666666667, 'specificity': 0.988544, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=45,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 52290}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.9853125, 'confusion_matrix': array([[15472,   153],
       [   82,   293]]), 'sensibility': 0.7813333333333333, 'specificity': 0.990208, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=45,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 42530}
{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.934625, 'confusion_matrix': array([[14600,  1025],
       [   21,   354]]), 'sensibility': 0.944, 'specificity': 0.9344, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_spli



{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.973625, 'confusion_matrix': array([[15255,   370],
       [   52,   323]]), 'sensibility': 0.8613333333333333, 'specificity': 0.97632, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=50,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 29700}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.981625, 'confusion_matrix': array([[15432,   193],
       [  101,   274]]), 'sensibility': 0.7306666666666667, 'specificity': 0.987648, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=50,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 52430}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.985125, 'confusion_matrix': array([[15467,   158],
       [   80,   295]]), 'sensibility': 0.7866666666666666, 'specificity': 0.989888, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=50,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 41580}
{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.9221875, 'confusion_matrix': array([[14400,  1225],
       [   20,   355]]), 'sensibility': 0.9466666666666667, 'specificity': 0.9216, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min



{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.9569375, 'confusion_matrix': array([[14955,   670],
       [   19,   356]]), 'sensibility': 0.9493333333333334, 'specificity': 0.95712, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=100,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 16200}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.9793125, 'confusion_matrix': array([[15383,   242],
       [   89,   286]]), 'sensibility': 0.7626666666666667, 'specificity': 0.984512, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=100,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 46920}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.9834375, 'confusion_matrix': array([[15443,   182],
       [   83,   292]]), 'sensibility': 0.7786666666666666, 'specificity': 0.988352, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=100,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 43320}
{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.9165, 'confusion_matrix': array([[14300,  1325],
       [   11,   364]]), 'sensibility': 0.9706666666666667, 'specificity': 0.9152, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_



{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.9370625, 'confusion_matrix': array([[14632,   993],
       [   14,   361]]), 'sensibility': 0.9626666666666667, 'specificity': 0.936448, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=200,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 16930}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.978375, 'confusion_matrix': array([[15366,   259],
       [   87,   288]]), 'sensibility': 0.768, 'specificity': 0.983424, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=200,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 46090}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.9831875, 'confusion_matrix': array([[15433,   192],
       [   77,   298]]), 'sensibility': 0.7946666666666666, 'specificity': 0.987712, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=200,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 40420}
{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.9165, 'confusion_matrix': array([[14300,  1325],
       [   11,   364]]), 'sensibility': 0.9706666666666667, 'specificity': 0.9152, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_



{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.9380625, 'confusion_matrix': array([[14646,   979],
       [   12,   363]]), 'sensibility': 0.968, 'specificity': 0.937344, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=300,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 15790}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.975, 'confusion_matrix': array([[15311,   314],
       [   86,   289]]), 'sensibility': 0.7706666666666667, 'specificity': 0.979904, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=300,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 46140}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.9838125, 'confusion_matrix': array([[15450,   175],
       [   84,   291]]), 'sensibility': 0.776, 'specificity': 0.9888, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=300,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 43750}
{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.9165, 'confusion_matrix': array([[14300,  1325],
       [   11,   364]]), 'sensibility': 0.9706666666666667, 'specificity': 0.9152, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=4



{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.9380625, 'confusion_matrix': array([[14646,   979],
       [   12,   363]]), 'sensibility': 0.968, 'specificity': 0.937344, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=400,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 15790}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.973875, 'confusion_matrix': array([[15288,   337],
       [   81,   294]]), 'sensibility': 0.784, 'specificity': 0.978432, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=400,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 43870}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.98075, 'confusion_matrix': array([[15385,   240],
       [   68,   307]]), 'sensibility': 0.8186666666666667, 'specificity': 0.98464, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=400,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 36400}
{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.9165, 'confusion_matrix': array([[14300,  1325],
       [   11,   364]]), 'sensibility': 0.9706666666666667, 'specificity': 0.9152, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_sam



{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.9370625, 'confusion_matrix': array([[14630,   995],
       [   12,   363]]), 'sensibility': 0.968, 'specificity': 0.93632, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=500,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 15950}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.966125, 'confusion_matrix': array([[15162,   463],
       [   79,   296]]), 'sensibility': 0.7893333333333333, 'specificity': 0.970368, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=500,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 44130}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.979, 'confusion_matrix': array([[15352,   273],
       [   63,   312]]), 'sensibility': 0.832, 'specificity': 0.982528, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=500,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 34230}
{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.9165, 'confusion_matrix': array([[14300,  1325],
       [   11,   364]]), 'sensibility': 0.9706666666666667, 'specificity': 0.9152, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=600



{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.937625, 'confusion_matrix': array([[14632,   993],
       [    5,   370]]), 'sensibility': 0.9866666666666667, 'specificity': 0.936448, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=600,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 12430}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.9654375, 'confusion_matrix': array([[15147,   478],
       [   75,   300]]), 'sensibility': 0.8, 'specificity': 0.969408, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=600,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 42280}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.97925, 'confusion_matrix': array([[15351,   274],
       [   58,   317]]), 'sensibility': 0.8453333333333334, 'specificity': 0.982464, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=600,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 31740}
{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.9165, 'confusion_matrix': array([[14300,  1325],
       [   11,   364]]), 'sensibility': 0.9706666666666667, 'specificity': 0.9152, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_sa



{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.9376875, 'confusion_matrix': array([[14633,   992],
       [    5,   370]]), 'sensibility': 0.9866666666666667, 'specificity': 0.936512, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=700,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 12420}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.965375, 'confusion_matrix': array([[15141,   484],
       [   70,   305]]), 'sensibility': 0.8133333333333334, 'specificity': 0.969024, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=700,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 39840}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.978, 'confusion_matrix': array([[15322,   303],
       [   49,   326]]), 'sensibility': 0.8693333333333333, 'specificity': 0.980608, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=700,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 27530}
{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.9165, 'confusion_matrix': array([[14300,  1325],
       [   11,   364]]), 'sensibility': 0.9706666666666667, 'specificity': 0.9152, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samp



{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.9374375, 'confusion_matrix': array([[14629,   996],
       [    5,   370]]), 'sensibility': 0.9866666666666667, 'specificity': 0.936256, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=800,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 12460}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.9638125, 'confusion_matrix': array([[15115,   510],
       [   69,   306]]), 'sensibility': 0.816, 'specificity': 0.96736, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=800,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 39600}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.976875, 'confusion_matrix': array([[15305,   320],
       [   50,   325]]), 'sensibility': 0.8666666666666667, 'specificity': 0.97952, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=800,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 28200}
{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.9164375, 'confusion_matrix': array([[14297,  1328],
       [    9,   366]]), 'sensibility': 0.976, 'specificity': 0.915008, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_sp



{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.936625, 'confusion_matrix': array([[14616,  1009],
       [    5,   370]]), 'sensibility': 0.9866666666666667, 'specificity': 0.935424, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=900,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 12590}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.9635625, 'confusion_matrix': array([[15108,   517],
       [   66,   309]]), 'sensibility': 0.824, 'specificity': 0.966912, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=900,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 38170}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.97675, 'confusion_matrix': array([[15302,   323],
       [   49,   326]]), 'sensibility': 0.8693333333333333, 'specificity': 0.979328, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=900,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 27730}
{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.92875, 'confusion_matrix': array([[14502,  1123],
       [   17,   358]]), 'sensibility': 0.9546666666666667, 'specificity': 0.928128, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min



{'predicted': array([0, 0, 1, ..., 0, 0, 0]), 'accuracy': 0.937625, 'confusion_matrix': array([[14632,   993],
       [    5,   370]]), 'sensibility': 0.9866666666666667, 'specificity': 0.936448, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=1000,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 12430}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.96375, 'confusion_matrix': array([[15110,   515],
       [   65,   310]]), 'sensibility': 0.8266666666666667, 'specificity': 0.96704, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=1000,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 37650}




{'predicted': array([0, 0, 0, ..., 0, 0, 0]), 'accuracy': 0.9741875, 'confusion_matrix': array([[15260,   365],
       [   48,   327]]), 'sensibility': 0.872, 'specificity': 0.97664, 'clf': DecisionTreeClassifier(class_weight=None, criterion='gini', max_depth=None,
            max_features=None, max_leaf_nodes=None,
            min_impurity_decrease=0.0, min_impurity_split=None,
            min_samples_leaf=1, min_samples_split=1000,
            min_weight_fraction_leaf=0.0, presort=False, random_state=None,
            splitter='best'), 'score': 27650}


In [12]:
plt.figure(figsize=(16,6))
filename = 'dt_balancing'
#measures = pd.DataFrame.from_dict(measures, "index")
#measures.to_csv('plot_data/{}.csv'.format(filename))
    
g = sns.FacetGrid(measures, hue="Technique", size=8)
g = g.map(plt.scatter, "Min Samples to Split", "Price").add_legend()
g = g.map(plt.plot, "Min Samples to Split", "Price")
g.axes[0,0].set_ylim(ymin=0)

plt.savefig('images/{}.pdf'.format(filename))
plt.clf()



<Figure size 1152x432 with 0 Axes>

<Figure size 724.975x576 with 0 Axes>