# Prerequisite

Following packages must be installed to run codes below

```bash
$ pip3 install openpyxl 
```


In [1]:
%load_ext autoreload
%autoreload 2

# Add project path

In [2]:
import os
import sys
from pathlib import Path

PROJECT_PATH = Path().resolve().parent.parent
SRC_PATH = PROJECT_PATH / 'src'

sys.path.append(str(SRC_PATH))

In [3]:
exp_name = 'feature_selection_v3'

In [4]:
from project_paths import DATA_PATH
import pandas as pd

EXP_RESULT_PATH = DATA_PATH / 'experiment_result' / 'feature_selection_v2'

aggregated_result_path = EXP_RESULT_PATH / 'result.csv'

v2_exp_result = pd.read_csv(aggregated_result_path)

In [5]:
sectors = [
    '제조업(10~34)',
    '부동산업(68)',
    '도매 및 소매업(45~47)',
    '숙박 및 음식점업(55~56)',
    '건설업(41~42)'
]
years_to_close = [
    'Closed_In_1Yr',
    'Closed_In_2Yrs',
]

In [6]:
best_features = {}

for sector in sectors : 
    best_features[sector] = {}

for sector in sectors : 
    for target_years_to_close in years_to_close : 
        best_features[sector][target_years_to_close] = (
            v2_exp_result
            .loc[lambda x : x['대분류']==sector]
            .loc[lambda x : x['Fold']=='Mean']
            .loc[lambda x : x['target']==target_years_to_close]
            .set_index('feature_selection')
            ['AUC'].idxmax()
        )

In [17]:
from pprint import pprint
pprint(best_features)

{'건설업(41~42)': {'Closed_In_1Yr': "['순운전자본/자산총계', '유동부채/유동자산', '유형자산', '자본금', "
                                 "'유보액/총자산(%)', '유보액/납입자본(%)', '차입금의존도(%)', "
                                 "'총자본회전율(회)', '매출채권회전율(회)', '매입채무회전율(회)', "
                                 "'Closed_In_1Yr']",
                'Closed_In_2Yrs': "['매출채권', '비유동자산', '유형자산', '판매비와관리비', "
                                  "'기업순이익률(%)', '매출액총이익률(%)', '경상수지비율', "
                                  "'차입금의존도(%)', '유동부채비율(%)', '미수금', "
                                  "'Closed_In_2Yrs']"},
 '도매 및 소매업(45~47)': {'Closed_In_1Yr': "['유동자산/부채총계', '순운전자본/자산총계', '유동자산', "
                                      "'유형자산', '자산총계', '유동부채', '이익잉여금(결손금）', "
                                      "'매출액총이익률(%)', '경상수지비율', '매입채무회전율(회)', "
                                      "'Closed_In_1Yr']",
                     'Closed_In_2Yrs': "['당기순이익(손실)/자산총계', '순운전자본/자산총계', "
                                       "'매출채권', '비유동자산', '유형자산', '판매비와관

In [7]:
additional_features = {
    '제조업(10~34)' : [
        '3YEAR TREASURY',
        '5YEAR TREASURY',
        '10YEAR TREASURY',
        '3YEAR COPORATE BOND',
        'CD 91DAYS',
        'CALL RATE 1DAY',
        'BASE RATE',
        'DOW_JONES_COMMODITY_INDEX_PRICE',
        'DOW_JONES_COMMODITY_INDEX_CHANGE_RATE',
        'EXCHANGE_RATE_PRICE',
        'EXCHANGE_RATE_CHANGE_RATE',
    ],
    '부동산업(68)' : [
        'NATIONWIDE',
        'CAPITAL AREA',
        'NON CAPITAL AREA'
    ],
    '도매 및 소매업(45~47)' : [
        'CSI',
        'CCI',
        'CLI'
    ],
    '숙박 및 음식점업(55~56)' : [
        'CSI',
        'CCI',
        'CLI'
    ],
    '건설업(41~42)' : [
        '3YEAR TREASURY',
        '5YEAR TREASURY',
        '10YEAR TREASURY',
        '3YEAR COPORATE BOND',
        'CD 91DAYS',
        'CALL RATE 1DAY',
        'BASE RATE',
        'DOW_JONES_COMMODITY_INDEX_PRICE',
        'DOW_JONES_COMMODITY_INDEX_CHANGE_RATE',
        'EXCHANGE_RATE_PRICE',
        'EXCHANGE_RATE_CHANGE_RATE',
    ]
}

# Load data

In [8]:
from data_loader import SectorDataLoader

data_loader = SectorDataLoader()
data_finance = (
    data_loader
    .load_dataset()
    .pipe(data_loader.add_beaver_indicator)
    .pipe(data_loader.add_label)
)
data_finance.head()

Unnamed: 0,BIZ_NO,CMP_PFIX_NM,CMP_NM,CMP_NM1,CMP_SFIX_NM,CMP_ENM,BZ_TYP,CMP_TYP,CMP_SCL,PBCO_GB,...,STAT_OCR_DATE_y,Closed_Year,유동자산/부채총계,당기순이익(손실)/자산총계,부채총계/자산총계,순운전자본/자산총계,유동부채/유동자산,Years_From_Closed_Year_To_FS,Closed_In_1Yr,Closed_In_2Yrs
117,1018135422,(주),한국선박기술,,,Korea Marine Time Service,M,,2,2,...,20200930.0,2020.0,1.031451,0.038773,0.578094,0.543045,0.089273,2.0,0,1
219,1018154206,(주),드림미즈,,,"dreammiz Co., Ltd.",M,,2,2,...,20201231.0,2020.0,1.22004,0.001177,0.662356,0.608449,0.247063,2.0,0,1
279,1018163684,,디에프에스서울,,(주),DFS Seoul Ltd.,M,,2,2,...,20190917.0,2019.0,11.012914,0.046666,0.090794,0.909114,0.090802,1.0,1,1
339,1018178760,(주),대교디앤씨,,,"DAEGYO D & C CO.,LTD.",M,,2,2,...,20191010.0,2019.0,0.916364,-0.026128,1.091269,0.097514,0.902486,1.0,1,1
406,1018194173,,에코에너지,,(주),"Eco Energy Co.,Ltd.",M,,2,2,...,20200831.0,2020.0,1.183355,-0.062095,0.828142,0.194625,0.8014,2.0,0,1


In [9]:
from data_loader import IndexDataLoader
import pandas as pd
import ast

"""
index_features = [
    '3YEAR TREASURY',
    '5YEAR TREASURY',
    '10YEAR TREASURY',
    '3YEAR COPORATE BOND',
    'CD 91DAYS',
    'CALL RATE 1DAY',
    'BASE RATE',
    'YEAR_MONTH',
    'DOW_JONES_COMMODITY_INDEX_PRICE',
    'DOW_JONES_COMMODITY_INDEX_CHANGE_RATE',
    'EXCHANGE_RATE_PRICE',
    'EXCHANGE_RATE_CHANGE_RATE',
    'NATIONWIDE',
    'CAPITAL AREA',
    'NON CAPITAL AREA',
    'CSI',
    'CCI',
    'CLI',
]
"""
index_features = [
     '3YEAR TREASURY',
     '5YEAR TREASURY',
     '10YEAR TREASURY',
     '3YEAR COPORATE BOND',
     'CD 91DAYS',
     'CALL RATE 1DAY',
     'BASE RATE',
     'YEAR_MONTH',
     'DOW_JONES_COMMODITY_INDEX_PRICE',
     'DOW_JONES_COMMODITY_INDEX_CHANGE_RATE',
     'EXCHANGE_RATE_PRICE',
     'EXCHANGE_RATE_CHANGE_RATE',
     'NATIONWIDE',
     'CAPITAL AREA',
     'NON CAPITAL AREA',
     'CSI',
     'CCI',
     'CLI',
]

index_data_loader = IndexDataLoader()

index_data = (
    index_data_loader.load_interest_rate()
    .merge(
        (
            index_data_loader.load_dow_jones_commodity_index()
            .rename(columns={'PRICE':'DOW_JONES_COMMODITY_INDEX_PRICE',
                            'CHANGE_RATE':'DOW_JONES_COMMODITY_INDEX_CHANGE_RATE'})
        ),
        how='outer',
        left_on='YEAR_MONTH',
        right_on='YEAR_MONTH'
    )
    .merge(
        (
            index_data_loader.load_exchange_rate()
            .rename(columns={'PRICE':'EXCHANGE_RATE_PRICE',
                            'CHANGE_RATE':'EXCHANGE_RATE_CHANGE_RATE'})
        ),
        how='outer',
        left_on='YEAR_MONTH',
        right_on='YEAR_MONTH'
    )
    .merge(
        (
            index_data_loader.load_apartment_housing_index()
        ),
        how='outer',
        left_on='YEAR_MONTH',
        right_on='YEAR_MONTH'
        
    )
    .merge(
        (
            index_data_loader.load_csi()
        ),
        how='outer',
        left_on='YEAR_MONTH',
        right_on='YEAR_MONTH'
    )
    .merge(
        (
            index_data_loader.load_composite_index()
            .rename(columns={'PRICE':'DOW_JONES_COMMODITY_INDEX_PRICE',
                            'CHANGE_RATE':'DOW_JONES_COMMODITY_INDEX_CHANGE_RATE'})
        ),
        how='outer',
        left_on='YEAR_MONTH',
        right_on='YEAR_MONTH'
    )
    .assign(year=lambda x : x['YEAR_MONTH'].dt.year)
    .assign(month=lambda x : x['YEAR_MONTH'].dt.month)
    .groupby(['year'])
    [index_features].mean()
    .reset_index(drop=False)
)

index_data

Unnamed: 0,year,3YEAR TREASURY,5YEAR TREASURY,10YEAR TREASURY,3YEAR COPORATE BOND,CD 91DAYS,CALL RATE 1DAY,BASE RATE,DOW_JONES_COMMODITY_INDEX_PRICE,DOW_JONES_COMMODITY_INDEX_CHANGE_RATE,EXCHANGE_RATE_PRICE,EXCHANGE_RATE_CHANGE_RATE,NATIONWIDE,CAPITAL AREA,NON CAPITAL AREA,CSI,CCI,CLI
0,2006,,,,,,,,,,,,63.841667,68.6,58.416667,,,
1,2007,,,,,,,,,,,,72.758333,82.441667,60.925,,,
2,2008,,,,,,,,,,,,76.775,89.15,62.991667,,,
3,2009,,,,,,,,,,,,76.058333,87.833333,64.2,,,
4,2010,,,,,,,,,,,,77.733333,86.833333,69.516667,,,
5,2011,,,,,,,,,,,,83.7,86.85,80.983333,,,
6,2012,,,,,,,,,,,,83.883333,81.891667,85.25,,,
7,2013,,,,,,,,,,,,84.325,80.333333,87.125,,,
8,2014,,,,,,,,,,,,88.008333,83.366667,91.325,,,
9,2015,,,,,,,,,,,,94.008333,89.175,97.658333,,,


In [10]:
data = (
    data_finance
    .assign(year=lambda x : x['결산년월'].astype(str).str[:4].astype(int))
    .merge(
        index_data,
        how='left',
        left_on='year',
        right_on='year'
    )
)
data

Unnamed: 0,BIZ_NO,CMP_PFIX_NM,CMP_NM,CMP_NM1,CMP_SFIX_NM,CMP_ENM,BZ_TYP,CMP_TYP,CMP_SCL,PBCO_GB,...,DOW_JONES_COMMODITY_INDEX_PRICE,DOW_JONES_COMMODITY_INDEX_CHANGE_RATE,EXCHANGE_RATE_PRICE,EXCHANGE_RATE_CHANGE_RATE,NATIONWIDE,CAPITAL AREA,NON CAPITAL AREA,CSI,CCI,CLI
0,1018135422,(주),한국선박기술,,,Korea Marine Time Service,M,,2,2,...,625.940833,-0.695000,1098.985000,0.372500,100.608333,104.325000,97.441667,104.083333,101.425000,100.058333
1,1018154206,(주),드림미즈,,,"dreammiz Co., Ltd.",M,,2,2,...,625.940833,-0.695000,1098.985000,0.372500,100.608333,104.325000,97.441667,104.083333,101.425000,100.058333
2,1018163684,,디에프에스서울,,(주),DFS Seoul Ltd.,M,,2,2,...,625.940833,-0.695000,1098.985000,0.372500,100.608333,104.325000,97.441667,104.083333,101.425000,100.058333
3,1018178760,(주),대교디앤씨,,,"DAEGYO D & C CO.,LTD.",M,,2,2,...,625.940833,-0.695000,1098.985000,0.372500,100.608333,104.325000,97.441667,104.083333,101.425000,100.058333
4,1018194173,,에코에너지,,(주),"Eco Energy Co.,Ltd.",M,,2,2,...,625.940833,-0.695000,1098.985000,0.372500,100.608333,104.325000,97.441667,104.083333,101.425000,100.058333
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
10516,8998700283,(주),덕성건설,,,Deokseong Construction,M,,2,2,...,625.940833,-0.695000,1098.985000,0.372500,100.608333,104.325000,97.441667,104.083333,101.425000,100.058333
10517,8998700283,(주),덕성건설,,,Deokseong Construction,M,,2,2,...,614.237500,0.997500,1164.787500,0.317500,100.108333,107.183333,94.075000,99.083333,100.258333,98.475000
10518,8998701263,,하나머스트제6호기업인수목적,,(주),HANA MUST SIXTH SPECIAL PURPOSE ACQUISITION CO...,M,,2,2,...,625.940833,-0.695000,1098.985000,0.372500,100.608333,104.325000,97.441667,104.083333,101.425000,100.058333
10519,8998701263,,하나머스트제6호기업인수목적,,(주),HANA MUST SIXTH SPECIAL PURPOSE ACQUISITION CO...,M,,2,2,...,614.237500,0.997500,1164.787500,0.317500,100.108333,107.183333,94.075000,99.083333,100.258333,98.475000


# Baseline classifier using Beaver's features

In [11]:
from project_paths import DATA_PATH

sectors = [
    '제조업(10~34)',
    '부동산업(68)',
    '도매 및 소매업(45~47)',
    '숙박 및 음식점업(55~56)',
    '건설업(41~42)'
]

beaver_features = [
    '유동자산/부채총계',
    '당기순이익(손실)/자산총계',
    '부채총계/자산총계',
    '순운전자본/자산총계',
    '유동부채/유동자산'
]

extended_financial_features = [
    '유동자산',
    '매출채권',
    '비유동자산',
    '유형자산',
    '자산총계',
    '유동부채',
    '비유동부채',
    '부  채  총  계',
    '자본금',
    '이익잉여금(결손금）',
    '자본총계',
    '매출액',
    '판매비와관리비',
    '영업이익（손실）',
    '법인세비용차감전순손익',
    '법인세비용',
    '당기순이익(손실)',
    '기업순이익률(%)',
    '유보액/총자산(%)',
    '유보액/납입자본(%)',
    '매출액총이익률(%)',
    '매출액영업이익률(%)',
    '매출액순이익률(%)',
    '수지비율(%)',
    '경상수지비율',
    '영업비율(%)',
    '금융비용대매출액비율(%',
    '금융비용대부채비율(%)',
    '금융비용대총비용비율(%',
    '부채비율(%)',
    '차입금의존도(%)',
    '자기자본비율(%)',
    '순운전자본비율(%)',
    '유동부채비율(%)',
    '비유동부채비율(%)',
    '부채총계대 매출액(%)',
    '총자본회전율(회)',
    '재고자산회전율(회)',
    '매출채권회전율(회)',
    '매입채무회전율(회)',
    '미수금',
    '매출원가',
    '무형자산',
    '재고자산',
]

years_to_close = [
    'Closed_In_1Yr',
    'Closed_In_2Yrs',
]

x_data_year = list(range(2018, 2020))

EXP_RESULT_PATH = DATA_PATH / 'experiment_result' / exp_name

if not os.path.exists(EXP_RESULT_PATH) : 
    os.mkdir(EXP_RESULT_PATH)

In [12]:
import numpy as np
import pandas as pd
from pycaret.classification import ClassificationExperiment
from tqdm import tqdm

In [13]:
exp_result = None

for target_years_to_close in tqdm(years_to_close) : 
    for x_data_target_year in tqdm(x_data_year, leave=True) : 
        for sector in sectors : 

            filename = EXP_RESULT_PATH / f'Beaver_baseline_{sector}_{target_years_to_close}_{x_data_target_year}.csv'

            if not os.path.exists(filename) : 

                data_to_train = (
                    data
                    .loc[~data[beaver_features[0]].isin([np.nan, np.inf, -np.inf]), :]
                    .loc[~data[beaver_features[1]].isin([np.nan, np.inf, -np.inf]), :]
                    .loc[~data[beaver_features[2]].isin([np.nan, np.inf, -np.inf]), :]
                    .loc[~data[beaver_features[3]].isin([np.nan, np.inf, -np.inf]), :]
                    .loc[~data[beaver_features[4]].isin([np.nan, np.inf, -np.inf]), :]
                    .loc[lambda x : pd.to_datetime(x['결산년월'], format='%Y%m%d').dt.year==x_data_target_year]
                    .loc[lambda x : x['대분류']==sector]
                )

                exp = ClassificationExperiment()

                target_features = (
                    [x for x in ast.literal_eval(best_features[sector][target_years_to_close]) if 'Closed' not in x]
                    + additional_features[sector]
                    + [target_years_to_close]
                )
                              
                exp.setup(
                    (
                        data_to_train
                        .loc[:, target_features]
                        .reset_index(drop=True)
                        .fillna(0)
                    ),
                    target=target_years_to_close,
                    #feature_selection=True,
                    #remove_multicollinearity = True,
                )

                models = exp.compare_models(sort='AUC', n_select=3)
                tuned_models = [exp.tune_model(x) for x in models]
                
                #if target_years_to_close == 'Closed_In_1Yr' :
                blended_model = exp.blend_models(estimator_list=tuned_models, fold=5, method = 'soft')
                result = (
                    exp.pull()
                    .assign(target=target_years_to_close)
                    .assign(x_data_yaer=x_data_target_year)
                    .assign(대분류=sector)
                    .reset_index(drop=False)
                    .rename(columns={'index':'model_name'})
                )
                result['feature_selection'] = str(exp.dataset_transformed.columns.tolist())
                result.to_csv(filename)

            else : 
                result = pd.read_csv(filename)

            if exp_result is None : 
                exp_result = result
            else : 
                exp_result = pd.concat([exp_result, result], axis=0)

  0%|                                                                                                                                                                                                                   | 0/2 [00:00<?, ?it/s]
  0%|                                                                                                                                                                                                                   | 0/2 [00:00<?, ?it/s][A

Unnamed: 0,Description,Value
0,Session id,8686
1,Target,Closed_In_1Yr
2,Target type,Binary
3,Original data shape,"(1800, 22)"
4,Transformed data shape,"(1800, 11)"
5,Transformed train set shape,"(1259, 11)"
6,Transformed test set shape,"(541, 11)"
7,Numeric features,21
8,Preprocess,True
9,Imputation type,simple


Unnamed: 0,Model,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC,TT (Sec)
rf,Random Forest Classifier,0.8713,0.6766,0.1096,0.5517,0.1778,0.1409,0.1967,0.094
nb,Naive Bayes,0.857,0.6442,0.1029,0.3119,0.1514,0.0996,0.1167,0.005
et,Extra Trees Classifier,0.8745,0.6431,0.121,0.5983,0.1953,0.1597,0.221,0.068
lightgbm,Light Gradient Boosting Machine,0.8697,0.6383,0.1397,0.4702,0.2112,0.1661,0.2027,0.049
gbc,Gradient Boosting Classifier,0.8642,0.6369,0.086,0.365,0.1349,0.0962,0.1251,0.062
lda,Linear Discriminant Analysis,0.8649,0.6338,0.036,0.2667,0.0622,0.0391,0.0609,0.007
knn,K Neighbors Classifier,0.8602,0.6124,0.0662,0.27,0.1053,0.0655,0.0841,0.014
ada,Ada Boost Classifier,0.8665,0.6084,0.1096,0.4708,0.1725,0.1303,0.1742,0.027
qda,Quadratic Discriminant Analysis,0.8149,0.6047,0.1456,0.219,0.1681,0.0703,0.0745,0.006
dt,Decision Tree Classifier,0.7983,0.5882,0.2871,0.258,0.2679,0.153,0.1548,0.008


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.8651,0.4778,0.0,0.0,0.0,-0.0152,-0.0341
1,0.873,0.6852,0.0,0.0,0.0,0.0,0.0
2,0.881,0.6608,0.0625,1.0,0.1176,0.1043,0.2345
3,0.8889,0.7693,0.125,1.0,0.2222,0.1996,0.333
4,0.881,0.6557,0.0625,1.0,0.1176,0.1043,0.2345
5,0.881,0.762,0.1176,1.0,0.2105,0.1874,0.3216
6,0.873,0.7205,0.1176,0.6667,0.2,0.1663,0.2431
7,0.8651,0.6236,0.0,0.0,0.0,0.0,0.0
8,0.881,0.7232,0.1176,1.0,0.2105,0.1874,0.3216
9,0.872,0.5986,0.0,0.0,0.0,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.8571,0.4682,0.0,0.0,0.0,-0.029,-0.0484
1,0.873,0.633,0.1875,0.5,0.2727,0.2186,0.2505
2,0.873,0.7199,0.0625,0.5,0.1111,0.0853,0.1423
3,0.8651,0.6403,0.0625,0.3333,0.1053,0.0679,0.0968
4,0.873,0.5994,0.0625,0.5,0.1111,0.0853,0.1423
5,0.873,0.7366,0.1765,0.6,0.2727,0.2252,0.2767
6,0.8333,0.7507,0.0588,0.1667,0.087,0.0178,0.0208
7,0.881,0.6317,0.1765,0.75,0.2857,0.247,0.326
8,0.8492,0.6352,0.0,0.0,0.0,-0.0292,-0.0502
9,0.848,0.6365,0.0625,0.2,0.0952,0.0365,0.044


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.873,0.452,0.0,0.0,0.0,0.0,0.0
1,0.873,0.6497,0.0,0.0,0.0,0.0,0.0
2,0.873,0.7267,0.0,0.0,0.0,0.0,0.0
3,0.873,0.598,0.0,0.0,0.0,0.0,0.0
4,0.873,0.6,0.0,0.0,0.0,0.0,0.0
5,0.8651,0.731,0.0,0.0,0.0,0.0,0.0
6,0.8651,0.7358,0.0,0.0,0.0,0.0,0.0
7,0.8651,0.6538,0.0,0.0,0.0,0.0,0.0
8,0.8651,0.6363,0.0,0.0,0.0,0.0,0.0
9,0.872,0.6585,0.0,0.0,0.0,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits
Original model was better than the tuned model, hence it will be returned. NOTE: The display metrics are for the tuned model (not the original one).


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.8294,0.5741,0.1212,0.2222,0.1569,0.071,0.075
1,0.881,0.6657,0.1515,0.7143,0.25,0.214,0.2923
2,0.8889,0.7109,0.1515,1.0,0.2632,0.2369,0.3665
3,0.8849,0.6781,0.1515,0.8333,0.2564,0.2252,0.3252
4,0.8645,0.6511,0.0625,0.3333,0.1053,0.0677,0.0966
Mean,0.8697,0.656,0.1277,0.6206,0.2063,0.1629,0.2311
Std,0.0218,0.0455,0.0346,0.2964,0.0637,0.0768,0.1211


Unnamed: 0,Description,Value
0,Session id,4096
1,Target,Closed_In_1Yr
2,Target type,Binary
3,Original data shape,"(323, 14)"
4,Transformed data shape,"(323, 11)"
5,Transformed train set shape,"(226, 11)"
6,Transformed test set shape,"(97, 11)"
7,Numeric features,13
8,Preprocess,True
9,Imputation type,simple


Unnamed: 0,Model,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC,TT (Sec)
lightgbm,Light Gradient Boosting Machine,0.8142,0.7734,0.41,0.6662,0.469,0.3686,0.402,0.007
ada,Ada Boost Classifier,0.8229,0.7634,0.405,0.7162,0.4876,0.3912,0.4301,0.015
rf,Random Forest Classifier,0.8279,0.7344,0.37,0.7567,0.4661,0.3791,0.4269,0.048
gbc,Gradient Boosting Classifier,0.8144,0.715,0.41,0.6317,0.4753,0.3705,0.3934,0.018
et,Extra Trees Classifier,0.8415,0.7106,0.39,0.7917,0.4952,0.4169,0.464,0.043
dt,Decision Tree Classifier,0.7302,0.6632,0.55,0.4406,0.4705,0.3033,0.3151,0.005
lda,Linear Discriminant Analysis,0.7698,0.6544,0.06,0.175,0.0841,0.0178,0.0211,0.005
knn,K Neighbors Classifier,0.7964,0.6115,0.305,0.5333,0.3673,0.2687,0.2946,0.012
qda,Quadratic Discriminant Analysis,0.3589,0.6113,0.9,0.2329,0.3686,0.0585,0.1233,0.005
nb,Naive Bayes,0.2344,0.5967,1.0,0.2136,0.3516,0.0146,0.0605,0.005


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.7826,0.8,0.2,0.5,0.2857,0.1844,0.2114
1,0.7391,0.7222,0.2,0.3333,0.25,0.1039,0.1089
2,0.7826,0.8222,0.4,0.5,0.4444,0.3114,0.3144
3,0.913,0.8667,0.6,1.0,0.75,0.7013,0.7348
4,0.8261,0.7333,0.2,1.0,0.3333,0.2812,0.4045
5,0.8261,0.7111,0.2,1.0,0.3333,0.2812,0.4045
6,0.8182,0.8353,0.6,0.6,0.6,0.4824,0.4824
7,0.9091,0.8611,0.5,1.0,0.6667,0.6207,0.6708
8,0.8636,0.7222,0.25,1.0,0.4,0.3529,0.4629
9,0.8182,0.7222,0.25,0.5,0.3333,0.2414,0.2609


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.8696,0.8444,0.4,1.0,0.5714,0.5106,0.5855
1,0.8696,0.7444,0.4,1.0,0.5714,0.5106,0.5855
2,0.8261,0.7667,0.4,0.6667,0.5,0.4026,0.4219
3,0.8696,0.8889,0.4,1.0,0.5714,0.5106,0.5855
4,0.8261,0.5778,0.2,1.0,0.3333,0.2812,0.4045
5,0.8261,0.6333,0.2,1.0,0.3333,0.2812,0.4045
6,0.8182,0.8,0.2,1.0,0.3333,0.2787,0.4024
7,0.9091,0.8056,0.5,1.0,0.6667,0.6207,0.6708
8,0.8182,0.7153,0.25,0.5,0.3333,0.2414,0.2609
9,0.8636,0.6806,0.25,1.0,0.4,0.3529,0.4629


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.8696,0.7222,0.4,1.0,0.5714,0.5106,0.5855
1,0.8261,0.6556,0.2,1.0,0.3333,0.2812,0.4045
2,0.8261,0.7333,0.4,0.6667,0.5,0.4026,0.4219
3,0.8261,0.9333,0.2,1.0,0.3333,0.2812,0.4045
4,0.8261,0.6556,0.2,1.0,0.3333,0.2812,0.4045
5,0.8261,0.6667,0.2,1.0,0.3333,0.2812,0.4045
6,0.7727,0.8235,0.2,0.5,0.2857,0.1791,0.2058
7,0.9091,0.8194,0.5,1.0,0.6667,0.6207,0.6708
8,0.8182,0.5833,0.25,0.5,0.3333,0.2414,0.2609
9,0.8636,0.75,0.25,1.0,0.4,0.3529,0.4629


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.8261,0.7778,0.2,1.0,0.3333,0.2812,0.4045
1,0.8667,0.82,0.4,1.0,0.5714,0.5091,0.5843
2,0.8222,0.6728,0.2222,0.6667,0.3333,0.2593,0.3118
3,0.8,0.7685,0.3333,0.5,0.4,0.2857,0.2942
4,0.8,0.6265,0.2222,0.5,0.3077,0.2105,0.2343
Mean,0.823,0.7331,0.2756,0.7333,0.3892,0.3092,0.3658
Std,0.0244,0.0718,0.0777,0.2261,0.0961,0.1035,0.1222




Unnamed: 0,Description,Value
0,Session id,2817
1,Target,Closed_In_1Yr
2,Target type,Binary
3,Original data shape,"(1107, 14)"
4,Transformed data shape,"(1107, 11)"
5,Transformed train set shape,"(774, 11)"
6,Transformed test set shape,"(333, 11)"
7,Numeric features,13
8,Preprocess,True
9,Imputation type,simple


Unnamed: 0,Model,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC,TT (Sec)
rf,Random Forest Classifier,0.8553,0.7427,0.1902,0.5795,0.2743,0.2163,0.2614,0.069
nb,Naive Bayes,0.8345,0.728,0.1894,0.4025,0.253,0.1729,0.1909,0.006
lightgbm,Light Gradient Boosting Machine,0.8527,0.7237,0.2159,0.5494,0.2935,0.2299,0.2676,0.018
gbc,Gradient Boosting Classifier,0.8372,0.7211,0.1826,0.4013,0.2461,0.1701,0.1885,0.042
lda,Linear Discriminant Analysis,0.841,0.7161,0.0955,0.3983,0.148,0.0941,0.1261,0.005
et,Extra Trees Classifier,0.8488,0.6978,0.1811,0.5129,0.2559,0.1927,0.2285,0.053
qda,Quadratic Discriminant Analysis,0.8152,0.6746,0.2409,0.3443,0.2698,0.1711,0.1809,0.005
knn,K Neighbors Classifier,0.8411,0.6686,0.1826,0.4533,0.2514,0.18,0.2077,0.014
ada,Ada Boost Classifier,0.8179,0.6646,0.1136,0.2796,0.1562,0.0724,0.0851,0.024
dt,Decision Tree Classifier,0.7894,0.5982,0.2773,0.2964,0.2829,0.1614,0.1627,0.006


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.8205,0.8176,0.0,0.0,0.0,-0.046,-0.0692
1,0.859,0.8371,0.0833,1.0,0.1538,0.1333,0.2673
2,0.8718,0.8611,0.1667,1.0,0.2857,0.2529,0.3804
3,0.859,0.7702,0.0833,1.0,0.1538,0.1333,0.2673
4,0.8442,0.7796,0.0,0.0,0.0,-0.0244,-0.0468
5,0.8701,0.7507,0.1818,0.6667,0.2857,0.2391,0.3014
6,0.8701,0.8595,0.0909,1.0,0.1667,0.1463,0.281
7,0.8442,0.677,0.0909,0.3333,0.1429,0.087,0.1096
8,0.8831,0.6033,0.1818,1.0,0.3077,0.2759,0.4
9,0.8442,0.6821,0.0833,0.5,0.1429,0.1029,0.1549


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.8462,0.8024,0.0,0.0,0.0,0.0,0.0
1,0.8462,0.7828,0.0,0.0,0.0,0.0,0.0
2,0.8462,0.7626,0.0,0.0,0.0,0.0,0.0
3,0.8462,0.7235,0.0,0.0,0.0,0.0,0.0
4,0.8571,0.7479,0.0,0.0,0.0,0.0,0.0
5,0.8571,0.6653,0.0,0.0,0.0,0.0,0.0
6,0.8571,0.8581,0.0,0.0,0.0,0.0,0.0
7,0.8571,0.6371,0.0,0.0,0.0,0.0,0.0
8,0.8571,0.5579,0.0,0.0,0.0,0.0,0.0
9,0.8442,0.6897,0.0,0.0,0.0,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.859,0.7885,0.0833,1.0,0.1538,0.1333,0.2673
1,0.8846,0.8207,0.25,1.0,0.4,0.3607,0.469
2,0.8205,0.7955,0.1667,0.3333,0.2222,0.1333,0.1436
3,0.8718,0.7664,0.25,0.75,0.375,0.3229,0.3842
4,0.8701,0.781,0.0909,1.0,0.1667,0.1463,0.281
5,0.8571,0.7438,0.1818,0.5,0.2667,0.2062,0.2389
6,0.8831,0.8333,0.1818,1.0,0.3077,0.2759,0.4
7,0.8701,0.6921,0.2727,0.6,0.375,0.3137,0.3443
8,0.8442,0.5964,0.1818,0.4,0.25,0.1765,0.1936
9,0.8312,0.6705,0.1667,0.4,0.2353,0.1581,0.1774


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.8581,0.8172,0.0435,1.0,0.0833,0.0719,0.193
1,0.8516,0.8383,0.0,0.0,0.0,0.0,0.0
2,0.8516,0.7563,0.0,0.0,0.0,0.0,0.0
3,0.8516,0.7712,0.0,0.0,0.0,0.0,0.0
4,0.8506,0.6406,0.0,0.0,0.0,0.0,0.0
Mean,0.8527,0.7647,0.0087,0.2,0.0167,0.0144,0.0386
Std,0.0027,0.0688,0.0174,0.4,0.0333,0.0287,0.0772




Unnamed: 0,Description,Value
0,Session id,6079
1,Target,Closed_In_1Yr
2,Target type,Binary
3,Original data shape,"(205, 14)"
4,Transformed data shape,"(205, 11)"
5,Transformed train set shape,"(143, 11)"
6,Transformed test set shape,"(62, 11)"
7,Numeric features,13
8,Preprocess,True
9,Imputation type,simple


Unnamed: 0,Model,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC,TT (Sec)
lightgbm,Light Gradient Boosting Machine,0.8029,0.855,0.6,0.7286,0.616,0.4959,0.5243,0.006
gbc,Gradient Boosting Classifier,0.81,0.8522,0.65,0.6833,0.6383,0.5193,0.5371,0.012
rf,Random Forest Classifier,0.8314,0.8472,0.65,0.7567,0.6634,0.5603,0.5827,0.046
et,Extra Trees Classifier,0.831,0.8189,0.5917,0.7633,0.6348,0.5318,0.5574,0.041
knn,K Neighbors Classifier,0.7195,0.7935,0.4333,0.5283,0.4487,0.2715,0.2866,0.009
dt,Decision Tree Classifier,0.7895,0.7775,0.6833,0.6636,0.6337,0.4996,0.5261,0.004
ada,Ada Boost Classifier,0.7962,0.7703,0.5917,0.6583,0.5857,0.4565,0.4814,0.012
lda,Linear Discriminant Analysis,0.6838,0.6767,0.0833,0.1583,0.0983,0.0064,0.0155,0.005
nb,Naive Bayes,0.28,0.6599,0.9667,0.2648,0.4153,-0.0015,0.0036,0.004
qda,Quadratic Discriminant Analysis,0.4214,0.6491,0.8667,0.2982,0.4428,0.0798,0.1303,0.004


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.8667,0.9545,0.5,1.0,0.6667,0.5946,0.6504
1,0.8,0.6591,0.25,1.0,0.4,0.3284,0.4432
2,0.9333,0.9773,0.75,1.0,0.8571,0.8148,0.8292
3,0.8571,0.7576,0.3333,1.0,0.5,0.44,0.5311
4,0.8571,0.6667,0.6667,0.6667,0.6667,0.5758,0.5758
5,0.8571,1.0,0.5,1.0,0.6667,0.5882,0.6455
6,0.8571,0.9375,0.5,1.0,0.6667,0.5882,0.6455
7,0.7857,0.875,0.25,1.0,0.4,0.3226,0.4385
8,0.7857,0.775,0.25,1.0,0.4,0.3226,0.4385
9,0.8571,0.95,0.5,1.0,0.6667,0.5882,0.6455


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.9333,0.9545,1.0,0.8,0.8889,0.8421,0.8528
1,0.7333,0.7045,0.25,0.5,0.3333,0.1892,0.207
2,0.9333,0.9545,0.75,1.0,0.8571,0.8148,0.8292
3,0.7143,0.697,0.3333,0.3333,0.3333,0.1515,0.1515
4,0.7143,0.6667,0.6667,0.4,0.5,0.3171,0.3373
5,0.9286,1.0,0.75,1.0,0.8571,0.8108,0.8257
6,0.8571,0.9875,1.0,0.6667,0.8,0.6957,0.7303
7,0.8571,1.0,0.5,1.0,0.6667,0.5882,0.6455
8,0.8571,0.65,0.5,1.0,0.6667,0.5882,0.6455
9,0.7857,0.925,0.5,0.6667,0.5714,0.4324,0.4404


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.9333,0.9545,1.0,0.8,0.8889,0.8421,0.8528
1,0.8,0.6818,0.25,1.0,0.4,0.3284,0.4432
2,0.9333,1.0,0.75,1.0,0.8571,0.8148,0.8292
3,0.7143,0.7576,0.3333,0.3333,0.3333,0.1515,0.1515
4,0.6429,0.7273,0.6667,0.3333,0.4444,0.2222,0.2513
5,1.0,1.0,1.0,1.0,1.0,1.0,1.0
6,0.8571,0.9625,0.75,0.75,0.75,0.65,0.65
7,0.8571,0.85,0.5,1.0,0.6667,0.5882,0.6455
8,0.7857,0.625,0.5,0.6667,0.5714,0.4324,0.4404
9,0.7857,0.925,0.5,0.6667,0.5714,0.4324,0.4404


Fitting 10 folds for each of 10 candidates, totalling 100 fits
Original model was better than the tuned model, hence it will be returned. NOTE: The display metrics are for the tuned model (not the original one).


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.8621,0.8631,0.625,0.8333,0.7143,0.6258,0.6371
1,0.8621,0.881,0.625,0.8333,0.7143,0.6258,0.6371
2,0.8276,0.878,0.875,0.6364,0.7368,0.6133,0.6305
3,0.8571,0.8741,0.7143,0.7143,0.7143,0.619,0.619
4,0.8214,0.8095,0.5714,0.6667,0.6154,0.5,0.5025
Mean,0.8461,0.8611,0.6821,0.7368,0.699,0.5968,0.6052
Std,0.0178,0.0265,0.1068,0.0826,0.0427,0.0486,0.0518




Unnamed: 0,Description,Value
0,Session id,8902
1,Target,Closed_In_1Yr
2,Target type,Binary
3,Original data shape,"(435, 22)"
4,Transformed data shape,"(435, 11)"
5,Transformed train set shape,"(304, 11)"
6,Transformed test set shape,"(131, 11)"
7,Numeric features,21
8,Preprocess,True
9,Imputation type,simple


Unnamed: 0,Model,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC,TT (Sec)
gbc,Gradient Boosting Classifier,0.9014,0.6424,0.2167,0.3333,0.2467,0.2099,0.2223,0.021
rf,Random Forest Classifier,0.9046,0.638,0.1667,0.2833,0.19,0.1625,0.1788,0.049
lightgbm,Light Gradient Boosting Machine,0.8982,0.6304,0.1,0.125,0.1,0.0765,0.0802,0.009
ada,Ada Boost Classifier,0.8878,0.6124,0.25,0.3533,0.2652,0.2149,0.2296,0.015
dt,Decision Tree Classifier,0.8488,0.6085,0.25,0.145,0.1816,0.1081,0.1151,0.005
dummy,Dummy Classifier,0.9113,0.5,0.0,0.0,0.0,0.0,0.0,0.006
et,Extra Trees Classifier,0.9047,0.4655,0.1,0.1,0.1,0.0831,0.0819,0.046
lr,Logistic Regression,0.7473,0.4595,0.2167,0.0681,0.1024,-0.0017,0.0016,0.03
knn,K Neighbors Classifier,0.908,0.4378,0.0,0.0,0.0,-0.0047,-0.005,0.012
qda,Quadratic Discriminant Analysis,0.5492,0.4275,0.3667,0.0553,0.0948,-0.0264,-0.0521,0.006


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.9032,0.3512,0.0,0.0,0.0,0.0,0.0
1,0.9032,0.6429,0.0,0.0,0.0,0.0,0.0
2,0.9032,0.7738,0.0,0.0,0.0,0.0,0.0
3,0.9032,0.619,0.0,0.0,0.0,0.0,0.0
4,0.9333,0.5446,0.0,0.0,0.0,0.0,0.0
5,0.9333,0.9286,0.0,0.0,0.0,0.0,0.0
6,0.9333,0.5357,0.0,0.0,0.0,0.0,0.0
7,0.9,0.642,0.0,0.0,0.0,0.0,0.0
8,0.9,0.6296,0.0,0.0,0.0,0.0,0.0
9,0.9,0.6173,0.0,0.0,0.0,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.9032,0.5,0.0,0.0,0.0,0.0,0.0
1,0.9032,0.5,0.0,0.0,0.0,0.0,0.0
2,0.9032,0.5,0.0,0.0,0.0,0.0,0.0
3,0.9032,0.5,0.0,0.0,0.0,0.0,0.0
4,0.9333,0.5,0.0,0.0,0.0,0.0,0.0
5,0.9333,0.5,0.0,0.0,0.0,0.0,0.0
6,0.9333,0.5,0.0,0.0,0.0,0.0,0.0
7,0.9,0.5,0.0,0.0,0.0,0.0,0.0
8,0.9,0.5,0.0,0.0,0.0,0.0,0.0
9,0.9,0.5,0.0,0.0,0.0,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.9032,0.3214,0.0,0.0,0.0,0.0,0.0
1,0.9032,0.5,0.0,0.0,0.0,0.0,0.0
2,0.9032,0.5,0.0,0.0,0.0,0.0,0.0
3,0.9032,0.5,0.0,0.0,0.0,0.0,0.0
4,0.9333,0.5,0.0,0.0,0.0,0.0,0.0
5,0.9333,0.5,0.0,0.0,0.0,0.0,0.0
6,0.9333,0.5,0.0,0.0,0.0,0.0,0.0
7,0.9,0.5,0.0,0.0,0.0,0.0,0.0
8,0.9,0.5,0.0,0.0,0.0,0.0,0.0
9,0.9,0.5,0.0,0.0,0.0,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.918,0.2786,0.0,0.0,0.0,0.0,0.0
1,0.918,0.5893,0.0,0.0,0.0,0.0,0.0
2,0.9016,0.6667,0.0,0.0,0.0,0.0,0.0
3,0.9016,0.6636,0.0,0.0,0.0,0.0,0.0
4,0.9167,0.5709,0.0,0.0,0.0,0.0,0.0
Mean,0.9112,0.5538,0.0,0.0,0.0,0.0,0.0
Std,0.0078,0.1429,0.0,0.0,0.0,0.0,0.0





 50%|█████████████████████████████████████████████████████████████████████████████████████████████████████                                                                                                     | 1/2 [01:49<01:49, 109.92s/it][A

Unnamed: 0,Description,Value
0,Session id,4989
1,Target,Closed_In_1Yr
2,Target type,Binary
3,Original data shape,"(828, 22)"
4,Transformed data shape,"(828, 11)"
5,Transformed train set shape,"(579, 11)"
6,Transformed test set shape,"(249, 11)"
7,Numeric features,21
8,Preprocess,True
9,Imputation type,simple


Unnamed: 0,Model,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC,TT (Sec)
lightgbm,Light Gradient Boosting Machine,0.7943,0.6188,0.1455,0.3883,0.2082,0.1208,0.1404,0.012
et,Extra Trees Classifier,0.7979,0.6112,0.1,0.3726,0.1544,0.0855,0.1092,0.05
rf,Random Forest Classifier,0.8082,0.6056,0.0909,0.4167,0.1484,0.0964,0.1357,0.06
lda,Linear Discriminant Analysis,0.8031,0.6014,0.0455,0.35,0.0795,0.0396,0.0721,0.005
gbc,Gradient Boosting Classifier,0.7858,0.6007,0.1,0.3283,0.1517,0.0642,0.082,0.028
ada,Ada Boost Classifier,0.7788,0.5812,0.1455,0.3275,0.1958,0.0917,0.1036,0.016
lr,Logistic Regression,0.7495,0.572,0.1727,0.2302,0.1957,0.0622,0.0631,0.038
qda,Quadratic Discriminant Analysis,0.2625,0.5568,0.9,0.1939,0.3169,0.0078,0.0097,0.005
knn,K Neighbors Classifier,0.7926,0.5557,0.1,0.3317,0.1512,0.0749,0.0917,0.014
dt,Decision Tree Classifier,0.7167,0.5538,0.2909,0.2778,0.2806,0.1066,0.1076,0.007


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.8103,0.4836,0.0,0.0,0.0,0.0,0.0
1,0.8103,0.499,0.0,0.0,0.0,0.0,0.0
2,0.8103,0.6015,0.0,0.0,0.0,0.0,0.0
3,0.8103,0.5745,0.0,0.0,0.0,0.0,0.0
4,0.8103,0.5938,0.0,0.0,0.0,0.0,0.0
5,0.8103,0.6538,0.0,0.0,0.0,0.0,0.0
6,0.8103,0.824,0.0,0.0,0.0,0.0,0.0
7,0.8103,0.7137,0.0,0.0,0.0,0.0,0.0
8,0.8103,0.6673,0.0,0.0,0.0,0.0,0.0
9,0.807,0.5652,0.0,0.0,0.0,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.8103,0.5,0.0,0.0,0.0,0.0,0.0
1,0.8103,0.5,0.0,0.0,0.0,0.0,0.0
2,0.8103,0.5,0.0,0.0,0.0,0.0,0.0
3,0.8103,0.5,0.0,0.0,0.0,0.0,0.0
4,0.8103,0.5,0.0,0.0,0.0,0.0,0.0
5,0.8103,0.5,0.0,0.0,0.0,0.0,0.0
6,0.8103,0.5,0.0,0.0,0.0,0.0,0.0
7,0.8103,0.5,0.0,0.0,0.0,0.0,0.0
8,0.8103,0.5,0.0,0.0,0.0,0.0,0.0
9,0.807,0.5,0.0,0.0,0.0,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.8103,0.5,0.0,0.0,0.0,0.0,0.0
1,0.8103,0.5,0.0,0.0,0.0,0.0,0.0
2,0.8103,0.5,0.0,0.0,0.0,0.0,0.0
3,0.8103,0.5,0.0,0.0,0.0,0.0,0.0
4,0.8103,0.5,0.0,0.0,0.0,0.0,0.0
5,0.8103,0.5,0.0,0.0,0.0,0.0,0.0
6,0.8103,0.5,0.0,0.0,0.0,0.0,0.0
7,0.8103,0.5,0.0,0.0,0.0,0.0,0.0
8,0.8103,0.5,0.0,0.0,0.0,0.0,0.0
9,0.807,0.5,0.0,0.0,0.0,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.8103,0.4599,0.0,0.0,0.0,0.0,0.0
1,0.8103,0.5837,0.0,0.0,0.0,0.0,0.0
2,0.8103,0.6204,0.0,0.0,0.0,0.0,0.0
3,0.8103,0.7336,0.0,0.0,0.0,0.0,0.0
4,0.8087,0.6017,0.0,0.0,0.0,0.0,0.0
Mean,0.81,0.5998,0.0,0.0,0.0,0.0,0.0
Std,0.0007,0.0874,0.0,0.0,0.0,0.0,0.0




Unnamed: 0,Description,Value
0,Session id,6213
1,Target,Closed_In_1Yr
2,Target type,Binary
3,Original data shape,"(203, 14)"
4,Transformed data shape,"(203, 11)"
5,Transformed train set shape,"(142, 11)"
6,Transformed test set shape,"(61, 11)"
7,Numeric features,13
8,Preprocess,True
9,Imputation type,simple


Unnamed: 0,Model,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC,TT (Sec)
lda,Linear Discriminant Analysis,0.6914,0.6931,0.135,0.3667,0.1919,0.0886,0.1063,0.005
et,Extra Trees Classifier,0.6705,0.6833,0.23,0.3517,0.2607,0.1038,0.1116,0.037
rf,Random Forest Classifier,0.691,0.6511,0.205,0.45,0.2662,0.1287,0.1473,0.049
qda,Quadratic Discriminant Analysis,0.4157,0.6437,0.81,0.3212,0.4582,0.0349,0.0655,0.005
lr,Logistic Regression,0.6548,0.6365,0.225,0.2733,0.2398,0.0705,0.0737,0.025
nb,Naive Bayes,0.4229,0.6215,0.88,0.3332,0.482,0.0654,0.1381,0.004
knn,K Neighbors Classifier,0.6495,0.5947,0.215,0.3417,0.2607,0.0714,0.073,0.01
lightgbm,Light Gradient Boosting Machine,0.6476,0.5911,0.31,0.4143,0.3401,0.118,0.1203,0.006
ada,Ada Boost Classifier,0.6424,0.5861,0.35,0.41,0.3652,0.1248,0.1317,0.015
gbc,Gradient Boosting Classifier,0.649,0.5692,0.245,0.3417,0.2821,0.0749,0.0684,0.013


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.7333,0.52,0.2,1.0,0.3333,0.25,0.378
1,0.5333,0.36,0.0,0.0,0.0,-0.2353,-0.2774
2,0.5714,0.6222,0.0,0.0,0.0,-0.1351,-0.2067
3,0.7143,0.7111,0.4,0.6667,0.5,0.3171,0.3373
4,0.7143,0.625,0.0,0.0,0.0,0.0,0.0
5,0.7857,0.725,0.25,1.0,0.4,0.3226,0.4385
6,0.7143,0.8125,0.25,0.5,0.3333,0.1765,0.1936
7,0.7143,0.725,0.0,0.0,0.0,0.0,0.0
8,0.7143,1.0,0.0,0.0,0.0,0.0,0.0
9,0.7857,0.85,0.25,1.0,0.4,0.3226,0.4385


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.6667,0.55,0.0,0.0,0.0,0.0,0.0
1,0.6667,0.54,0.0,0.0,0.0,0.0,0.0
2,0.6429,0.6333,0.0,0.0,0.0,0.0,0.0
3,0.6429,0.6333,0.0,0.0,0.0,0.0,0.0
4,0.7143,0.5625,0.0,0.0,0.0,0.0,0.0
5,0.7143,0.775,0.0,0.0,0.0,0.0,0.0
6,0.7143,0.575,0.0,0.0,0.0,0.0,0.0
7,0.7143,0.625,0.0,0.0,0.0,0.0,0.0
8,0.7143,0.8,0.0,0.0,0.0,0.0,0.0
9,0.7143,0.8375,0.0,0.0,0.0,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.6667,0.5,0.0,0.0,0.0,0.0,0.0
1,0.6667,0.5,0.0,0.0,0.0,0.0,0.0
2,0.6429,0.5,0.0,0.0,0.0,0.0,0.0
3,0.6429,0.5,0.0,0.0,0.0,0.0,0.0
4,0.7143,0.5,0.0,0.0,0.0,0.0,0.0
5,0.7143,0.5,0.0,0.0,0.0,0.0,0.0
6,0.7143,0.5,0.0,0.0,0.0,0.0,0.0
7,0.7143,0.5,0.0,0.0,0.0,0.0,0.0
8,0.7143,0.5,0.0,0.0,0.0,0.0,0.0
9,0.7143,0.5,0.0,0.0,0.0,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits
Original model was better than the tuned model, hence it will be returned. NOTE: The display metrics are for the tuned model (not the original one).


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.7241,0.5278,0.1111,1.0,0.2,0.1471,0.2817
1,0.7241,0.7056,0.1111,1.0,0.2,0.1471,0.2817
2,0.7143,0.6784,0.1111,1.0,0.2,0.145,0.2796
3,0.7143,0.7924,0.2222,0.6667,0.3333,0.2057,0.2561
4,0.7143,0.6812,0.0,0.0,0.0,0.0,0.0
Mean,0.7182,0.6771,0.1111,0.7333,0.1867,0.129,0.2198
Std,0.0048,0.0853,0.0703,0.3887,0.1067,0.0685,0.1103


Unnamed: 0,Description,Value
0,Session id,6150
1,Target,Closed_In_1Yr
2,Target type,Binary
3,Original data shape,"(505, 14)"
4,Transformed data shape,"(505, 11)"
5,Transformed train set shape,"(353, 11)"
6,Transformed test set shape,"(152, 11)"
7,Numeric features,13
8,Preprocess,True
9,Imputation type,simple


Unnamed: 0,Model,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC,TT (Sec)
knn,K Neighbors Classifier,0.7221,0.5743,0.1911,0.2527,0.2154,0.0694,0.0674,0.011
rf,Random Forest Classifier,0.7621,0.5713,0.1018,0.4167,0.1564,0.074,0.107,0.056
ada,Ada Boost Classifier,0.7221,0.5612,0.1911,0.2598,0.2055,0.0687,0.0703,0.016
et,Extra Trees Classifier,0.7393,0.5434,0.0893,0.2667,0.1241,0.0202,0.0255,0.049
lightgbm,Light Gradient Boosting Machine,0.7137,0.5129,0.1411,0.268,0.1639,0.0202,0.0263,0.008
gbc,Gradient Boosting Classifier,0.7192,0.503,0.1143,0.2443,0.1483,0.0119,0.0144,0.021
dummy,Dummy Classifier,0.7762,0.5,0.0,0.0,0.0,0.0,0.0,0.005
lda,Linear Discriminant Analysis,0.762,0.496,0.0,0.0,0.0,-0.0253,-0.0358,0.006
dt,Decision Tree Classifier,0.617,0.4835,0.2161,0.1871,0.1968,-0.0494,-0.0496,0.005
qda,Quadratic Discriminant Analysis,0.6619,0.4738,0.15,0.0404,0.0636,-0.0379,-0.0656,0.006


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.7778,0.5603,0.0,0.0,0.0,0.0,0.0
1,0.7778,0.4799,0.0,0.0,0.0,0.0,0.0
2,0.7778,0.6853,0.0,0.0,0.0,0.0,0.0
3,0.7714,0.5463,0.0,0.0,0.0,0.0,0.0
4,0.7714,0.5764,0.0,0.0,0.0,0.0,0.0
5,0.7714,0.6458,0.0,0.0,0.0,0.0,0.0
6,0.7714,0.6157,0.0,0.0,0.0,0.0,0.0
7,0.7714,0.7014,0.0,0.0,0.0,0.0,0.0
8,0.7714,0.5972,0.0,0.0,0.0,0.0,0.0
9,0.8,0.6582,0.0,0.0,0.0,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.7778,0.5,0.0,0.0,0.0,0.0,0.0
1,0.7778,0.5,0.0,0.0,0.0,0.0,0.0
2,0.7778,0.5,0.0,0.0,0.0,0.0,0.0
3,0.7714,0.5,0.0,0.0,0.0,0.0,0.0
4,0.7714,0.5,0.0,0.0,0.0,0.0,0.0
5,0.7714,0.5,0.0,0.0,0.0,0.0,0.0
6,0.7714,0.5,0.0,0.0,0.0,0.0,0.0
7,0.7714,0.5,0.0,0.0,0.0,0.0,0.0
8,0.7714,0.5,0.0,0.0,0.0,0.0,0.0
9,0.8,0.5,0.0,0.0,0.0,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.7778,0.5,0.0,0.0,0.0,0.0,0.0
1,0.7778,0.5,0.0,0.0,0.0,0.0,0.0
2,0.7778,0.5,0.0,0.0,0.0,0.0,0.0
3,0.7714,0.5,0.0,0.0,0.0,0.0,0.0
4,0.7714,0.5,0.0,0.0,0.0,0.0,0.0
5,0.7714,0.5,0.0,0.0,0.0,0.0,0.0
6,0.7714,0.5,0.0,0.0,0.0,0.0,0.0
7,0.7714,0.5,0.0,0.0,0.0,0.0,0.0
8,0.7714,0.5,0.0,0.0,0.0,0.0,0.0
9,0.8,0.5,0.0,0.0,0.0,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.7746,0.5398,0.0,0.0,0.0,0.0,0.0
1,0.7746,0.5972,0.0,0.0,0.0,0.0,0.0
2,0.7746,0.5642,0.0,0.0,0.0,0.0,0.0
3,0.7714,0.7014,0.0,0.0,0.0,0.0,0.0
4,0.7857,0.6236,0.0,0.0,0.0,0.0,0.0
Mean,0.7762,0.6052,0.0,0.0,0.0,0.0,0.0
Std,0.0049,0.0559,0.0,0.0,0.0,0.0,0.0


Unnamed: 0,Description,Value
0,Session id,3499
1,Target,Closed_In_1Yr
2,Target type,Binary
3,Original data shape,"(65, 14)"
4,Transformed data shape,"(65, 11)"
5,Transformed train set shape,"(45, 11)"
6,Transformed test set shape,"(20, 11)"
7,Numeric features,13
8,Preprocess,True
9,Imputation type,simple


Unnamed: 0,Model,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC,TT (Sec)
ada,Ada Boost Classifier,0.725,0.7458,0.6,0.6667,0.5967,0.3992,0.43,0.011
et,Extra Trees Classifier,0.665,0.7125,0.45,0.6,0.4833,0.2558,0.2837,0.035
rf,Random Forest Classifier,0.635,0.6792,0.4,0.55,0.4333,0.1755,0.2079,0.042
dt,Decision Tree Classifier,0.67,0.6375,0.6,0.55,0.5367,0.2889,0.321,0.004
knn,K Neighbors Classifier,0.615,0.5875,0.45,0.4667,0.43,0.1447,0.1765,0.01
gbc,Gradient Boosting Classifier,0.615,0.5708,0.55,0.5,0.4833,0.1829,0.2208,0.009
qda,Quadratic Discriminant Analysis,0.555,0.5625,0.55,0.3733,0.4338,0.0747,0.0754,0.005
lr,Logistic Regression,0.6,0.5375,0.35,0.4667,0.38,0.11,0.1207,0.023
nb,Naive Bayes,0.425,0.5042,0.9,0.375,0.5257,-0.0333,-0.0333,0.005
dummy,Dummy Classifier,0.6,0.5,0.0,0.0,0.0,0.0,0.0,0.005


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,1.0,1.0,1.0,1.0,1.0,1.0,1.0
1,0.8,0.9167,0.5,1.0,0.6667,0.5455,0.6124
2,0.8,0.5,0.5,1.0,0.6667,0.5455,0.6124
3,0.6,0.5,1.0,0.5,0.6667,0.2857,0.4082
4,0.8,1.0,0.5,1.0,0.6667,0.5455,0.6124
5,0.75,0.6667,0.0,0.0,0.0,0.0,0.0
6,0.75,1.0,1.0,0.5,0.6667,0.5,0.5774
7,0.25,0.0,0.0,0.0,0.0,-0.5,-0.5774
8,1.0,1.0,1.0,1.0,1.0,1.0,1.0
9,0.5,0.625,0.5,0.5,0.5,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits
Original model was better than the tuned model, hence it will be returned. NOTE: The display metrics are for the tuned model (not the original one).


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.8,0.8333,0.5,1.0,0.6667,0.5455,0.6124
1,0.8,0.6667,0.5,1.0,0.6667,0.5455,0.6124
2,0.8,0.6667,0.5,1.0,0.6667,0.5455,0.6124
3,0.6,0.8333,1.0,0.5,0.6667,0.2857,0.4082
4,0.8,0.6667,0.5,1.0,0.6667,0.5455,0.6124
5,0.5,0.0,0.0,0.0,0.0,-0.3333,-0.3333
6,0.75,0.0,0.0,0.0,0.0,0.0,0.0
7,0.5,0.5,0.5,0.5,0.5,0.0,0.0
8,0.75,0.5,0.5,1.0,0.6667,0.5,0.5774
9,0.5,0.625,0.5,0.5,0.5,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.8,1.0,0.5,1.0,0.6667,0.5455,0.6124
1,0.6,0.75,0.5,0.5,0.5,0.1667,0.1667
2,0.8,0.75,0.5,1.0,0.6667,0.5455,0.6124
3,0.8,0.8333,1.0,0.6667,0.8,0.6154,0.6667
4,0.6,0.5833,0.5,0.5,0.5,0.1667,0.1667
5,0.75,0.5,0.0,0.0,0.0,0.0,0.0
6,0.5,0.3333,0.0,0.0,0.0,-0.3333,-0.3333
7,0.25,0.25,0.0,0.0,0.0,-0.5,-0.5774
8,1.0,1.0,1.0,1.0,1.0,1.0,1.0
9,0.75,0.75,1.0,0.6667,0.8,0.5,0.5774


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.6667,0.8889,0.3333,0.5,0.4,0.1818,0.189
1,0.7778,0.75,0.6667,0.6667,0.6667,0.5,0.5
2,0.8889,1.0,1.0,0.8,0.8889,0.7805,0.8
3,0.3333,0.3,0.25,0.25,0.25,-0.35,-0.35
4,0.6667,0.65,0.75,0.6,0.6667,0.3415,0.35
Mean,0.6667,0.7178,0.6,0.5633,0.5744,0.2908,0.2978
Std,0.1859,0.2405,0.2759,0.1845,0.2243,0.3765,0.3814


Unnamed: 0,Description,Value
0,Session id,6519
1,Target,Closed_In_1Yr
2,Target type,Binary
3,Original data shape,"(294, 22)"
4,Transformed data shape,"(294, 11)"
5,Transformed train set shape,"(205, 11)"
6,Transformed test set shape,"(89, 11)"
7,Numeric features,21
8,Preprocess,True
9,Imputation type,simple


Unnamed: 0,Model,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC,TT (Sec)
lr,Logistic Regression,0.7269,0.6113,0.1767,0.3917,0.2198,0.1057,0.1316,0.025
lda,Linear Discriminant Analysis,0.7119,0.5959,0.04,0.0833,0.0536,-0.0272,-0.0431,0.006
nb,Naive Bayes,0.7031,0.5956,0.2367,0.3786,0.2355,0.1068,0.1356,0.005
qda,Quadratic Discriminant Analysis,0.4529,0.5894,0.7233,0.2862,0.4078,0.0635,0.0772,0.005
rf,Random Forest Classifier,0.7121,0.5813,0.0967,0.2083,0.1202,0.0196,0.024,0.048
gbc,Gradient Boosting Classifier,0.7169,0.5749,0.2067,0.3967,0.2547,0.1114,0.13,0.015
knn,K Neighbors Classifier,0.6776,0.5662,0.1667,0.225,0.1872,0.0155,0.012,0.01
dt,Decision Tree Classifier,0.6083,0.547,0.3467,0.3096,0.3152,0.0515,0.0535,0.005
et,Extra Trees Classifier,0.6783,0.5394,0.0533,0.225,0.0819,-0.0665,-0.0588,0.045
ada,Ada Boost Classifier,0.6636,0.5138,0.1,0.1,0.1,-0.0601,-0.0703,0.013


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.7619,0.55,0.2,0.5,0.2857,0.1732,0.1995
1,0.8095,1.0,0.2,1.0,0.3333,0.2759,0.4
2,0.7143,0.65,0.2,0.3333,0.25,0.087,0.0913
3,0.619,0.5889,0.1667,0.25,0.2,-0.037,-0.0383
4,0.7143,0.6444,0.0,0.0,0.0,0.0,0.0
5,0.7,0.6133,0.2,0.3333,0.25,0.0769,0.0808
6,0.65,0.3067,0.0,0.0,0.0,-0.1667,-0.1925
7,0.8,0.5333,0.2,1.0,0.3333,0.2727,0.3974
8,0.75,0.52,0.0,0.0,0.0,0.0,0.0
9,0.75,0.7067,0.6,0.5,0.5455,0.375,0.378


Fitting 10 folds for each of 10 candidates, totalling 100 fits
Original model was better than the tuned model, hence it will be returned. NOTE: The display metrics are for the tuned model (not the original one).


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.7143,0.525,0.2,0.3333,0.25,0.087,0.0913
1,0.8095,0.775,0.2,1.0,0.3333,0.2759,0.4
2,0.7143,0.6125,0.2,0.3333,0.25,0.087,0.0913
3,0.7143,0.7,0.3333,0.5,0.4,0.2222,0.2301
4,0.7143,0.5333,0.0,0.0,0.0,0.0,0.0
5,0.75,0.56,0.2,0.5,0.2857,0.1667,0.1925
6,0.65,0.3933,0.0,0.0,0.0,-0.1667,-0.1925
7,0.8,0.46,0.2,1.0,0.3333,0.2727,0.3974
8,0.75,0.6333,0.0,0.0,0.0,0.0,0.0
9,0.75,0.6933,0.6,0.5,0.5455,0.375,0.378


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.7619,0.5625,0.2,0.5,0.2857,0.1732,0.1995
1,0.8095,0.95,0.2,1.0,0.3333,0.2759,0.4
2,0.7143,0.675,0.2,0.3333,0.25,0.087,0.0913
3,0.6667,0.5222,0.1667,0.3333,0.2222,0.0392,0.043
4,0.7143,0.6222,0.0,0.0,0.0,0.0,0.0
5,0.7,0.5467,0.2,0.3333,0.25,0.0769,0.0808
6,0.65,0.3333,0.0,0.0,0.0,-0.1667,-0.1925
7,0.8,0.52,0.2,1.0,0.3333,0.2727,0.3974
8,0.75,0.68,0.0,0.0,0.0,0.0,0.0
9,0.75,0.6,0.6,0.5,0.5455,0.375,0.378


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.7805,0.771,0.2,0.6667,0.3077,0.2199,0.2766
1,0.6829,0.5839,0.2,0.2857,0.2353,0.0431,0.0442
2,0.7561,0.5419,0.1,0.5,0.1667,0.0929,0.135
3,0.6829,0.3667,0.0,0.0,0.0,-0.09,-0.1371
4,0.7561,0.6273,0.3636,0.5714,0.4444,0.2979,0.3104
Mean,0.7317,0.5781,0.1727,0.4048,0.2308,0.1128,0.1258
Std,0.0408,0.1309,0.1209,0.2381,0.1476,0.1357,0.1629



100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 2/2 [03:12<00:00, 96.11s/it][A
 50%|█████████████████████████████████████████████████████████████████████████████████████████████████████                                                                                                     | 1/2 [03:12<03:12, 192.22s/it]
  0%|                                                                                                                                                                                                                   | 0/2 [00:00<?, ?it/s][A

Unnamed: 0,Description,Value
0,Session id,933
1,Target,Closed_In_2Yrs
2,Target type,Binary
3,Original data shape,"(1800, 22)"
4,Transformed data shape,"(1800, 11)"
5,Transformed train set shape,"(1259, 11)"
6,Transformed test set shape,"(541, 11)"
7,Numeric features,21
8,Preprocess,True
9,Imputation type,simple


Unnamed: 0,Model,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC,TT (Sec)
rf,Random Forest Classifier,0.5758,0.5922,0.4221,0.5422,0.473,0.1278,0.131,0.085
gbc,Gradient Boosting Classifier,0.5639,0.5802,0.4221,0.5242,0.4665,0.1054,0.1074,0.058
ada,Ada Boost Classifier,0.5671,0.5789,0.4291,0.5294,0.4733,0.1125,0.1147,0.023
lightgbm,Light Gradient Boosting Machine,0.5631,0.5769,0.4642,0.5242,0.4914,0.1108,0.112,0.018
et,Extra Trees Classifier,0.5298,0.5499,0.3641,0.476,0.4107,0.0318,0.0327,0.064
qda,Quadratic Discriminant Analysis,0.5473,0.5364,0.396,0.5358,0.4191,0.0726,0.0849,0.005
dt,Decision Tree Classifier,0.529,0.5319,0.5027,0.4803,0.4907,0.053,0.0534,0.006
lr,Logistic Regression,0.502,0.5267,0.6497,0.4654,0.5418,0.0282,0.03,0.024
lda,Linear Discriminant Analysis,0.5584,0.509,0.1366,0.5522,0.2167,0.048,0.0705,0.005
nb,Naive Bayes,0.5536,0.5061,0.0771,0.5726,0.1332,0.0283,0.0563,0.005


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.5714,0.6444,0.5263,0.5263,0.5263,0.135,0.135
1,0.5635,0.5446,0.4386,0.5208,0.4762,0.1067,0.1079
2,0.5556,0.5708,0.4211,0.5106,0.4615,0.0891,0.0903
3,0.5556,0.5566,0.4737,0.5094,0.4909,0.0975,0.0977
4,0.619,0.6267,0.5614,0.5818,0.5714,0.2288,0.2289
5,0.6032,0.6428,0.4386,0.5814,0.5,0.1816,0.1866
6,0.5317,0.5469,0.4561,0.4815,0.4685,0.0506,0.0506
7,0.5794,0.6186,0.4386,0.5435,0.4854,0.1365,0.1388
8,0.5556,0.5532,0.5172,0.5172,0.5172,0.1055,0.1055
9,0.56,0.5728,0.5789,0.5156,0.5455,0.1219,0.1226


Fitting 10 folds for each of 10 candidates, totalling 100 fits
Original model was better than the tuned model, hence it will be returned. NOTE: The display metrics are for the tuned model (not the original one).


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.6032,0.6393,0.3158,0.6207,0.4186,0.1633,0.1849
1,0.6429,0.5812,0.2807,0.8,0.4156,0.2361,0.3034
2,0.5476,0.5723,0.1754,0.5,0.2597,0.0323,0.0416
3,0.5635,0.5718,0.2632,0.5357,0.3529,0.0782,0.0895
4,0.5794,0.5955,0.2632,0.5769,0.3614,0.1089,0.1276
5,0.6429,0.6471,0.3158,0.75,0.4444,0.241,0.2901
6,0.5635,0.5456,0.2281,0.5417,0.321,0.0723,0.087
7,0.5714,0.6089,0.2281,0.5652,0.325,0.0877,0.1071
8,0.5238,0.5266,0.2241,0.4643,0.3023,0.0037,0.0043
9,0.616,0.5777,0.3684,0.6364,0.4667,0.1987,0.2169


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.5714,0.5884,0.386,0.5366,0.449,0.1134,0.1175
1,0.5476,0.5782,0.2281,0.5,0.3133,0.0416,0.0488
2,0.6349,0.6386,0.4211,0.6486,0.5106,0.24,0.2543
3,0.5635,0.5394,0.386,0.5238,0.4444,0.0984,0.1015
4,0.5,0.5357,0.2632,0.4167,0.3226,-0.0426,-0.0454
5,0.6032,0.6189,0.3158,0.6207,0.4186,0.1633,0.1849
6,0.5556,0.5622,0.3158,0.5143,0.3913,0.0718,0.0771
7,0.6032,0.6331,0.3158,0.6207,0.4186,0.1633,0.1849
8,0.5952,0.5302,0.3448,0.6061,0.4396,0.1587,0.1742
9,0.536,0.5734,0.2982,0.4857,0.3696,0.0346,0.0372


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.623,0.6039,0.4123,0.6267,0.4974,0.2158,0.2279
1,0.5714,0.5799,0.3509,0.5405,0.4255,0.1078,0.1142
2,0.6389,0.6554,0.3947,0.6716,0.4972,0.2441,0.2651
3,0.5833,0.5811,0.3652,0.5676,0.4444,0.1355,0.144
4,0.5578,0.5903,0.3684,0.5185,0.4308,0.0858,0.0892
Mean,0.5949,0.6021,0.3783,0.585,0.4591,0.1578,0.1681
Std,0.0309,0.028,0.0221,0.0565,0.0318,0.0616,0.0674


Unnamed: 0,Description,Value
0,Session id,1446
1,Target,Closed_In_2Yrs
2,Target type,Binary
3,Original data shape,"(323, 14)"
4,Transformed data shape,"(323, 11)"
5,Transformed train set shape,"(226, 11)"
6,Transformed test set shape,"(97, 11)"
7,Numeric features,13
8,Preprocess,True
9,Imputation type,simple


Unnamed: 0,Model,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC,TT (Sec)
rf,Random Forest Classifier,0.6069,0.6458,0.6364,0.6246,0.6257,0.213,0.216,0.049
gbc,Gradient Boosting Classifier,0.581,0.6353,0.5955,0.6061,0.5946,0.1625,0.1655,0.015
et,Extra Trees Classifier,0.5943,0.6325,0.628,0.6087,0.617,0.1848,0.1855,0.04
lightgbm,Light Gradient Boosting Machine,0.6065,0.6256,0.6189,0.6247,0.6178,0.2131,0.2158,0.007
ada,Ada Boost Classifier,0.5581,0.5837,0.5939,0.5795,0.5829,0.1141,0.1159,0.013
dt,Decision Tree Classifier,0.5451,0.5586,0.5341,0.5783,0.5503,0.0917,0.0935,0.005
knn,K Neighbors Classifier,0.5051,0.5421,0.6098,0.5342,0.5648,-0.001,-0.0049,0.01
dummy,Dummy Classifier,0.5221,0.5,1.0,0.5221,0.6859,0.0,0.0,0.004
lr,Logistic Regression,0.4769,0.4498,0.6689,0.4904,0.5574,-0.0593,-0.0714,0.022
lda,Linear Discriminant Analysis,0.5176,0.4403,0.8644,0.523,0.6507,0.0043,0.0039,0.004


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.7391,0.6667,0.75,0.75,0.75,0.4773,0.4773
1,0.4783,0.4091,0.5,0.5,0.5,-0.0455,-0.0455
2,0.6087,0.5985,0.8333,0.5882,0.6897,0.2008,0.2241
3,0.6522,0.6364,0.8333,0.625,0.7143,0.2923,0.3125
4,0.6522,0.6894,0.5833,0.7,0.6364,0.3083,0.313
5,0.6522,0.6818,0.75,0.6429,0.6923,0.2977,0.3024
6,0.5455,0.6033,0.6364,0.5385,0.5833,0.0909,0.0925
7,0.5909,0.7273,0.8182,0.5625,0.6667,0.1818,0.2041
8,0.6818,0.6667,0.5833,0.7778,0.6667,0.374,0.3882
9,0.6818,0.6917,0.75,0.6923,0.72,0.3529,0.3545


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.6522,0.6212,0.6667,0.6667,0.6667,0.303,0.303
1,0.5217,0.4091,0.5,0.5455,0.5217,0.0453,0.0455
2,0.6522,0.6515,0.75,0.6429,0.6923,0.2977,0.3024
3,0.6522,0.6439,0.75,0.6429,0.6923,0.2977,0.3024
4,0.6087,0.6742,0.5,0.6667,0.5714,0.2247,0.2326
5,0.6522,0.6136,0.75,0.6429,0.6923,0.2977,0.3024
6,0.5455,0.6116,0.6364,0.5385,0.5833,0.0909,0.0925
7,0.6364,0.7107,0.8182,0.6,0.6923,0.2727,0.2928
8,0.6364,0.7083,0.5833,0.7,0.6364,0.2787,0.2833
9,0.6818,0.6667,0.75,0.6923,0.72,0.3529,0.3545


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.6087,0.6136,0.75,0.6,0.6667,0.2069,0.2145
1,0.6087,0.5985,0.8333,0.5882,0.6897,0.2008,0.2241
2,0.6087,0.5682,0.75,0.6,0.6667,0.2069,0.2145
3,0.4348,0.4015,0.6667,0.4706,0.5517,-0.1544,-0.1724
4,0.6087,0.6364,0.6667,0.6154,0.64,0.2129,0.2137
5,0.6522,0.553,0.9167,0.6111,0.7333,0.2868,0.3395
6,0.5455,0.7107,0.8182,0.5294,0.6429,0.0909,0.1085
7,0.5455,0.4959,0.6364,0.5385,0.5833,0.0909,0.0925
8,0.6364,0.625,0.75,0.6429,0.6923,0.2542,0.2588
9,0.5909,0.5083,0.75,0.6,0.6667,0.1538,0.1604


Fitting 10 folds for each of 10 candidates, totalling 100 fits
Original model was better than the tuned model, hence it will be returned. NOTE: The display metrics are for the tuned model (not the original one).


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.6304,0.6307,0.625,0.6522,0.6383,0.2609,0.2611
1,0.5778,0.6344,0.6522,0.5769,0.6122,0.1526,0.154
2,0.5556,0.587,0.5217,0.5714,0.5455,0.1124,0.1129
3,0.6667,0.7123,0.7917,0.6552,0.717,0.3202,0.3288
4,0.6889,0.7242,0.5833,0.7778,0.6667,0.386,0.4001
Mean,0.6239,0.6577,0.6348,0.6467,0.6359,0.2464,0.2514
Std,0.0508,0.0523,0.0899,0.0746,0.057,0.1019,0.1066


Unnamed: 0,Description,Value
0,Session id,221
1,Target,Closed_In_2Yrs
2,Target type,Binary
3,Original data shape,"(1107, 14)"
4,Transformed data shape,"(1107, 11)"
5,Transformed train set shape,"(774, 11)"
6,Transformed test set shape,"(333, 11)"
7,Numeric features,13
8,Preprocess,True
9,Imputation type,simple


Unnamed: 0,Model,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC,TT (Sec)
rf,Random Forest Classifier,0.6162,0.6513,0.5048,0.6134,0.5506,0.2224,0.2267,0.067
et,Extra Trees Classifier,0.5852,0.6381,0.4724,0.5792,0.5182,0.1605,0.1645,0.056
lightgbm,Light Gradient Boosting Machine,0.5982,0.6328,0.5436,0.5827,0.5596,0.1916,0.1938,0.016
gbc,Gradient Boosting Classifier,0.6046,0.6319,0.5327,0.5936,0.5589,0.203,0.2054,0.037
ada,Ada Boost Classifier,0.6097,0.6238,0.5351,0.6,0.5636,0.2128,0.2153,0.018
knn,K Neighbors Classifier,0.5736,0.6098,0.508,0.5552,0.5293,0.1412,0.1423,0.011
nb,Naive Bayes,0.5543,0.5733,0.1202,0.6496,0.2002,0.0665,0.111,0.005
lda,Linear Discriminant Analysis,0.5583,0.5637,0.2103,0.6088,0.3089,0.0834,0.1133,0.005
dt,Decision Tree Classifier,0.5514,0.5553,0.5019,0.5296,0.5127,0.0978,0.0993,0.006
qda,Quadratic Discriminant Analysis,0.5531,0.5472,0.1124,0.6821,0.1876,0.0638,0.1136,0.005


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.6026,0.675,0.4865,0.6,0.5373,0.1956,0.1989
1,0.6154,0.648,0.5135,0.6129,0.5588,0.2226,0.2253
2,0.6795,0.7126,0.5405,0.7143,0.6154,0.3496,0.3596
3,0.6026,0.6539,0.5946,0.5789,0.5867,0.2041,0.2041
4,0.6364,0.6572,0.5556,0.625,0.5882,0.2647,0.2661
5,0.6494,0.6585,0.5833,0.6364,0.6087,0.2921,0.293
6,0.5195,0.4953,0.3889,0.4828,0.4308,0.0233,0.0237
7,0.5714,0.6897,0.3333,0.5714,0.4211,0.1168,0.1275
8,0.6494,0.6764,0.4865,0.6923,0.5714,0.2897,0.3027
9,0.5325,0.6105,0.4595,0.5152,0.4857,0.0597,0.06


Fitting 10 folds for each of 10 candidates, totalling 100 fits
Original model was better than the tuned model, hence it will be returned. NOTE: The display metrics are for the tuned model (not the original one).


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.6538,0.6579,0.5676,0.6562,0.6087,0.3013,0.3038
1,0.5385,0.5656,0.4324,0.5161,0.4706,0.0671,0.0679
2,0.6282,0.6704,0.4595,0.6538,0.5397,0.2435,0.2542
3,0.5897,0.6546,0.4595,0.5862,0.5152,0.1686,0.1723
4,0.6104,0.5928,0.5,0.6,0.5455,0.2094,0.2121
5,0.5974,0.6348,0.4444,0.5926,0.5079,0.1789,0.1842
6,0.5065,0.5061,0.3889,0.4667,0.4242,-0.0014,-0.0014
7,0.5974,0.7012,0.3611,0.619,0.4561,0.1703,0.186
8,0.6234,0.6372,0.4595,0.6538,0.5397,0.2371,0.2477
9,0.6104,0.6307,0.4865,0.6207,0.5455,0.2132,0.2181


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.5897,0.6836,0.4324,0.5926,0.5,0.1663,0.1723
1,0.6026,0.6447,0.5946,0.5789,0.5867,0.2041,0.2041
2,0.641,0.6533,0.5676,0.6364,0.6,0.2763,0.2778
3,0.6538,0.6915,0.5946,0.6471,0.6197,0.3031,0.304
4,0.5974,0.6206,0.5556,0.5714,0.5634,0.19,0.1901
5,0.6104,0.6423,0.6111,0.5789,0.5946,0.2201,0.2204
6,0.5195,0.5176,0.4722,0.4857,0.4789,0.0333,0.0333
7,0.6494,0.6531,0.5,0.6667,0.5714,0.2848,0.2933
8,0.6104,0.6547,0.6216,0.5897,0.6053,0.2212,0.2215
9,0.5974,0.5963,0.4324,0.6154,0.5079,0.1845,0.1927


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.5871,0.6535,0.5479,0.5634,0.5556,0.1702,0.1702
1,0.6258,0.6523,0.5479,0.6154,0.5797,0.2445,0.2459
2,0.6387,0.6558,0.6027,0.6197,0.6111,0.2739,0.274
3,0.5548,0.5807,0.4189,0.5439,0.4733,0.0989,0.1014
4,0.5974,0.6533,0.5342,0.5821,0.5571,0.1893,0.1899
Mean,0.6008,0.6391,0.5304,0.5849,0.5554,0.1954,0.1963
Std,0.0296,0.0292,0.0605,0.0293,0.0457,0.0609,0.0603




Unnamed: 0,Description,Value
0,Session id,6754
1,Target,Closed_In_2Yrs
2,Target type,Binary
3,Original data shape,"(205, 14)"
4,Transformed data shape,"(205, 11)"
5,Transformed train set shape,"(143, 11)"
6,Transformed test set shape,"(62, 11)"
7,Numeric features,13
8,Preprocess,True
9,Imputation type,simple


Unnamed: 0,Model,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC,TT (Sec)
rf,Random Forest Classifier,0.6519,0.6577,0.8322,0.6873,0.7468,0.1888,0.2237,0.05
ada,Ada Boost Classifier,0.6581,0.6243,0.8078,0.7019,0.7462,0.2229,0.2553,0.012
gbc,Gradient Boosting Classifier,0.6248,0.6126,0.7433,0.6921,0.7106,0.1686,0.1743,0.012
knn,K Neighbors Classifier,0.6224,0.6108,0.7411,0.6974,0.7113,0.1572,0.1783,0.009
et,Extra Trees Classifier,0.6105,0.6059,0.7867,0.6712,0.7188,0.0907,0.0993,0.039
lightgbm,Light Gradient Boosting Machine,0.609,0.5897,0.7733,0.6707,0.7127,0.0959,0.1248,0.006
lda,Linear Discriminant Analysis,0.6229,0.5843,0.9378,0.6423,0.7602,-0.0015,-0.0009,0.004
dt,Decision Tree Classifier,0.5752,0.5417,0.6978,0.6654,0.673,0.0567,0.0707,0.005
qda,Quadratic Discriminant Analysis,0.6171,0.5269,0.94,0.6342,0.7546,-0.0139,0.0011,0.005
dummy,Dummy Classifier,0.6433,0.5,1.0,0.6433,0.7828,0.0,0.0,0.004


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.6667,0.5,1.0,0.6667,0.8,0.0,0.0
1,0.6667,0.5,1.0,0.6667,0.8,0.0,0.0
2,0.6,0.5,1.0,0.6,0.75,0.0,0.0
3,0.6429,0.5,1.0,0.6429,0.7826,0.0,0.0
4,0.6429,0.5,1.0,0.6429,0.7826,0.0,0.0
5,0.6429,0.5,1.0,0.6429,0.7826,0.0,0.0
6,0.6429,0.5,1.0,0.6429,0.7826,0.0,0.0
7,0.6429,0.5,1.0,0.6429,0.7826,0.0,0.0
8,0.6429,0.5,1.0,0.6429,0.7826,0.0,0.0
9,0.6429,0.5,1.0,0.6429,0.7826,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits
Original model was better than the tuned model, hence it will be returned. NOTE: The display metrics are for the tuned model (not the original one).


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.6,0.57,0.7,0.7,0.7,0.1,0.1
1,0.3333,0.38,0.5,0.5,0.5,-0.5,-0.5
2,0.6,0.5926,0.8889,0.6154,0.7273,0.0625,0.0801
3,0.7857,0.5333,1.0,0.75,0.8571,0.4615,0.5477
4,0.6429,0.5111,0.8889,0.6667,0.7619,0.1026,0.1217
5,0.7143,0.6444,0.7778,0.7778,0.7778,0.3778,0.3778
6,0.6429,0.3556,0.8889,0.6667,0.7619,0.1026,0.1217
7,0.6429,0.6444,1.0,0.6429,0.7826,0.0,0.0
8,0.5714,0.2333,0.7778,0.6364,0.7,-0.0244,-0.0259
9,0.7143,0.7444,0.8889,0.7273,0.8,0.3171,0.3373


Fitting 10 folds for each of 10 candidates, totalling 100 fits
Original model was better than the tuned model, hence it will be returned. NOTE: The display metrics are for the tuned model (not the original one).


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.7333,0.81,0.8,0.8,0.8,0.4,0.4
1,0.4667,0.48,0.4,0.6667,0.5,0.0,0.0
2,0.7333,0.8704,0.8889,0.7273,0.8,0.4118,0.4308
3,0.7143,0.6444,1.0,0.6923,0.8182,0.2432,0.3721
4,0.6429,0.4889,0.8889,0.6667,0.7619,0.1026,0.1217
5,0.5714,0.8,0.5556,0.7143,0.625,0.1429,0.1491
6,0.6429,0.6444,0.8889,0.6667,0.7619,0.1026,0.1217
7,0.7857,0.8222,0.8889,0.8,0.8421,0.5116,0.5185
8,0.5,0.3889,0.6667,0.6,0.6316,-0.1395,-0.1414
9,0.7857,0.7556,0.8889,0.8,0.8421,0.5116,0.5185


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.5172,0.5447,0.5789,0.6471,0.6111,-0.0201,-0.0203
1,0.6552,0.7842,0.8421,0.6957,0.7619,0.157,0.1667
2,0.7241,0.6263,0.8889,0.7273,0.8,0.3696,0.3894
3,0.6786,0.7333,0.9444,0.68,0.7907,0.1711,0.2238
4,0.6071,0.5667,0.7778,0.6667,0.7179,0.0833,0.0861
Mean,0.6365,0.651,0.8064,0.6833,0.7363,0.1522,0.1691
Std,0.0705,0.0933,0.1262,0.0272,0.0688,0.1281,0.1373


Unnamed: 0,Description,Value
0,Session id,7663
1,Target,Closed_In_2Yrs
2,Target type,Binary
3,Original data shape,"(435, 22)"
4,Transformed data shape,"(435, 11)"
5,Transformed train set shape,"(304, 11)"
6,Transformed test set shape,"(131, 11)"
7,Numeric features,21
8,Preprocess,True
9,Imputation type,simple


Unnamed: 0,Model,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC,TT (Sec)
gbc,Gradient Boosting Classifier,0.589,0.6078,0.3159,0.4563,0.3626,0.0827,0.087,0.021
lightgbm,Light Gradient Boosting Machine,0.5856,0.5914,0.3735,0.4575,0.4063,0.0959,0.0986,0.009
ada,Ada Boost Classifier,0.612,0.5648,0.3848,0.5145,0.4188,0.145,0.1575,0.017
lda,Linear Discriminant Analysis,0.612,0.558,0.1212,0.5117,0.1867,0.0533,0.0765,0.005
rf,Random Forest Classifier,0.5956,0.5555,0.2644,0.4685,0.3292,0.0753,0.0833,0.058
qda,Quadratic Discriminant Analysis,0.4968,0.5171,0.3386,0.2778,0.2849,-0.0735,-0.0894,0.006
et,Extra Trees Classifier,0.5792,0.5136,0.3144,0.4568,0.3555,0.0645,0.0733,0.042
dt,Decision Tree Classifier,0.5296,0.5108,0.4182,0.4023,0.4049,0.02,0.0207,0.006
dummy,Dummy Classifier,0.6118,0.5,0.0,0.0,0.0,0.0,0.0,0.006
nb,Naive Bayes,0.5692,0.4914,0.075,0.1938,0.0797,-0.0515,-0.0829,0.005


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.6129,0.6842,0.0,0.0,0.0,0.0,0.0
1,0.6129,0.5965,0.0,0.0,0.0,0.0,0.0
2,0.6129,0.5658,0.0,0.0,0.0,0.0,0.0
3,0.6129,0.4693,0.0,0.0,0.0,0.0,0.0
4,0.6333,0.6029,0.0,0.0,0.0,0.0,0.0
5,0.6333,0.6364,0.0,0.0,0.0,0.0,0.0
6,0.6,0.4954,0.0,0.0,0.0,0.0,0.0
7,0.6,0.3056,0.0,0.0,0.0,0.0,0.0
8,0.6,0.4769,0.0,0.0,0.0,0.0,0.0
9,0.6,0.5208,0.0,0.0,0.0,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.6129,0.5,0.0,0.0,0.0,0.0,0.0
1,0.6129,0.5,0.0,0.0,0.0,0.0,0.0
2,0.6129,0.5,0.0,0.0,0.0,0.0,0.0
3,0.6129,0.5,0.0,0.0,0.0,0.0,0.0
4,0.6333,0.5,0.0,0.0,0.0,0.0,0.0
5,0.6333,0.5,0.0,0.0,0.0,0.0,0.0
6,0.6,0.5,0.0,0.0,0.0,0.0,0.0
7,0.6,0.5,0.0,0.0,0.0,0.0,0.0
8,0.6,0.5,0.0,0.0,0.0,0.0,0.0
9,0.6,0.5,0.0,0.0,0.0,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.6774,0.5351,0.1667,1.0,0.2857,0.1969,0.3304
1,0.5806,0.5329,0.0833,0.3333,0.1333,-0.0254,-0.0361
2,0.6129,0.4781,0.0833,0.5,0.1429,0.0363,0.0609
3,0.6129,0.4386,0.0,0.0,0.0,0.0,0.0
4,0.6333,0.5239,0.0909,0.5,0.1538,0.0462,0.0739
5,0.6667,0.5455,0.1818,0.6667,0.2857,0.1525,0.2075
6,0.6,0.4028,0.0,0.0,0.0,0.0,0.0
7,0.6,0.3565,0.0,0.0,0.0,0.0,0.0
8,0.6333,0.5,0.0833,1.0,0.1538,0.0984,0.2274
9,0.6333,0.4583,0.0833,1.0,0.1538,0.0984,0.2274


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.6557,0.6419,0.1304,0.75,0.2222,0.1244,0.2039
1,0.6066,0.5788,0.0417,0.5,0.0769,0.0174,0.0402
2,0.6066,0.487,0.0,0.0,0.0,0.0,0.0
3,0.6066,0.5,0.0,0.0,0.0,0.0,0.0
4,0.6167,0.3825,0.0,0.0,0.0,0.0,0.0
Mean,0.6184,0.518,0.0344,0.25,0.0598,0.0284,0.0488
Std,0.0191,0.088,0.0506,0.3162,0.0865,0.0485,0.0791





 50%|█████████████████████████████████████████████████████████████████████████████████████████████████████                                                                                                     | 1/2 [01:47<01:47, 107.09s/it][A

Unnamed: 0,Description,Value
0,Session id,1683
1,Target,Closed_In_2Yrs
2,Target type,Binary
3,Original data shape,"(828, 22)"
4,Transformed data shape,"(828, 11)"
5,Transformed train set shape,"(579, 11)"
6,Transformed test set shape,"(249, 11)"
7,Numeric features,21
8,Preprocess,True
9,Imputation type,simple


Unnamed: 0,Model,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC,TT (Sec)
qda,Quadratic Discriminant Analysis,0.4542,0.6001,0.2815,0.8442,0.4134,0.1014,0.1615,0.005
et,Extra Trees Classifier,0.6943,0.5767,0.9118,0.7259,0.8078,0.1024,0.1188,0.056
lda,Linear Discriminant Analysis,0.6995,0.568,0.9926,0.7031,0.8231,-0.0101,-0.0259,0.006
nb,Naive Bayes,0.6788,0.5651,0.9167,0.7111,0.8002,0.0348,0.0537,0.005
lightgbm,Light Gradient Boosting Machine,0.658,0.5493,0.8381,0.7213,0.775,0.0757,0.0819,0.013
rf,Random Forest Classifier,0.6943,0.543,0.9362,0.7166,0.8115,0.0677,0.0988,0.064
knn,K Neighbors Classifier,0.6303,0.5412,0.8015,0.7114,0.7528,0.0246,0.0252,0.011
ada,Ada Boost Classifier,0.651,0.5394,0.8629,0.7067,0.7763,0.012,0.0197,0.017
dt,Decision Tree Classifier,0.6045,0.539,0.6959,0.731,0.7121,0.0776,0.0786,0.006
gbc,Gradient Boosting Classifier,0.6649,0.5159,0.897,0.7063,0.79,0.0113,0.0171,0.033


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.6207,0.6542,0.625,0.7812,0.6944,0.2104,0.2196
1,0.6552,0.703,0.7561,0.7561,0.7561,0.1679,0.1679
2,0.6379,0.5093,0.7805,0.7273,0.7529,0.0787,0.0794
3,0.5,0.5201,0.5122,0.7,0.5915,-0.0145,-0.0157
4,0.431,0.4978,0.4634,0.6333,0.5352,-0.1544,-0.1673
5,0.5862,0.66,0.5854,0.7742,0.6667,0.1481,0.1584
6,0.6207,0.5811,0.6585,0.7714,0.7105,0.1704,0.1749
7,0.6379,0.665,0.7073,0.7632,0.7342,0.1692,0.1704
8,0.569,0.6607,0.6585,0.7105,0.6835,0.0109,0.011
9,0.5789,0.5941,0.625,0.7353,0.6757,0.0868,0.0891


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.6897,0.6181,1.0,0.6897,0.8163,0.0,0.0
1,0.7069,0.6514,1.0,0.7069,0.8283,0.0,0.0
2,0.7069,0.571,1.0,0.7069,0.8283,0.0,0.0
3,0.7069,0.5222,1.0,0.7069,0.8283,0.0,0.0
4,0.7069,0.4261,1.0,0.7069,0.8283,0.0,0.0
5,0.7069,0.6514,1.0,0.7069,0.8283,0.0,0.0
6,0.7069,0.5782,1.0,0.7069,0.8283,0.0,0.0
7,0.7069,0.6428,1.0,0.7069,0.8283,0.0,0.0
8,0.7069,0.5395,1.0,0.7069,0.8283,0.0,0.0
9,0.7018,0.5559,1.0,0.7018,0.8247,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.6897,0.5701,1.0,0.6897,0.8163,0.0,0.0
1,0.7069,0.5516,1.0,0.7069,0.8283,0.0,0.0
2,0.7069,0.6334,1.0,0.7069,0.8283,0.0,0.0
3,0.6897,0.5115,0.9756,0.7018,0.8163,-0.0337,-0.0853
4,0.7069,0.4161,1.0,0.7069,0.8283,0.0,0.0
5,0.7069,0.5057,1.0,0.7069,0.8283,0.0,0.0
6,0.7069,0.6141,1.0,0.7069,0.8283,0.0,0.0
7,0.7069,0.5201,1.0,0.7069,0.8283,0.0,0.0
8,0.7069,0.3931,1.0,0.7069,0.8283,0.0,0.0
9,0.7018,0.511,1.0,0.7018,0.8247,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.681,0.6533,0.9136,0.7115,0.8,0.0694,0.0851
1,0.5776,0.495,0.6585,0.72,0.6879,0.0386,0.0389
2,0.6121,0.5653,0.6707,0.7534,0.7097,0.1312,0.1332
3,0.6724,0.618,0.7805,0.7619,0.7711,0.1956,0.1958
4,0.6,0.5432,0.6914,0.7273,0.7089,0.0713,0.0715
Mean,0.6286,0.5749,0.7429,0.7348,0.7355,0.1012,0.1049
Std,0.0409,0.0556,0.0954,0.0195,0.0426,0.0559,0.0546


Unnamed: 0,Description,Value
0,Session id,7498
1,Target,Closed_In_2Yrs
2,Target type,Binary
3,Original data shape,"(203, 14)"
4,Transformed data shape,"(203, 11)"
5,Transformed train set shape,"(142, 11)"
6,Transformed test set shape,"(61, 11)"
7,Numeric features,13
8,Preprocess,True
9,Imputation type,simple


Unnamed: 0,Model,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC,TT (Sec)
gbc,Gradient Boosting Classifier,0.8381,0.8201,0.9394,0.8726,0.9041,0.3498,0.3684,0.013
rf,Random Forest Classifier,0.8452,0.8181,0.9659,0.8647,0.9111,0.3057,0.3293,0.044
et,Extra Trees Classifier,0.8667,0.81,0.9742,0.8788,0.9227,0.4266,0.4545,0.037
lightgbm,Light Gradient Boosting Machine,0.8243,0.7924,0.9402,0.8595,0.8965,0.2784,0.3022,0.006
ada,Ada Boost Classifier,0.8448,0.7561,0.9485,0.8745,0.9092,0.3638,0.388,0.012
dt,Decision Tree Classifier,0.7971,0.6811,0.8621,0.8912,0.872,0.3241,0.34,0.004
knn,K Neighbors Classifier,0.7957,0.6189,0.922,0.8423,0.8794,0.1634,0.1708,0.011
qda,Quadratic Discriminant Analysis,0.3819,0.5747,0.2826,0.849,0.4122,0.0404,0.0719,0.004
nb,Naive Bayes,0.2329,0.5431,0.0773,0.6667,0.136,0.0009,0.0126,0.005
lr,Logistic Regression,0.24,0.5076,0.0909,0.0833,0.087,0.0276,0.0284,0.025


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.8,0.8056,1.0,0.8,0.8889,0.0,0.0
1,0.8667,0.75,1.0,0.8571,0.9231,0.4444,0.5345
2,0.9286,0.875,1.0,0.9231,0.96,0.6316,0.6794
3,0.7857,0.8333,0.9167,0.8462,0.88,-0.1053,-0.1132
4,0.8571,0.9583,0.9167,0.9167,0.9167,0.4167,0.4167
5,0.8571,0.8333,0.9167,0.9167,0.9167,0.4167,0.4167
6,0.9286,0.8788,1.0,0.9167,0.9565,0.7586,0.7817
7,0.7857,0.7879,0.9091,0.8333,0.8696,0.2759,0.2843
8,0.8571,0.8182,1.0,0.8462,0.9167,0.44,0.5311
9,0.7857,0.6667,1.0,0.7857,0.88,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.8,0.5,1.0,0.8,0.8889,0.0,0.0
1,0.8,0.5,1.0,0.8,0.8889,0.0,0.0
2,0.8571,0.5,1.0,0.8571,0.9231,0.0,0.0
3,0.8571,0.5,1.0,0.8571,0.9231,0.0,0.0
4,0.8571,0.5,1.0,0.8571,0.9231,0.0,0.0
5,0.8571,0.5,1.0,0.8571,0.9231,0.0,0.0
6,0.7857,0.5,1.0,0.7857,0.88,0.0,0.0
7,0.7857,0.5,1.0,0.7857,0.88,0.0,0.0
8,0.7857,0.5,1.0,0.7857,0.88,0.0,0.0
9,0.7857,0.5,1.0,0.7857,0.88,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits
Original model was better than the tuned model, hence it will be returned. NOTE: The display metrics are for the tuned model (not the original one).


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.8,0.7222,0.9167,0.8462,0.88,0.2857,0.2942
1,0.8667,0.7778,1.0,0.8571,0.9231,0.4444,0.5345
2,0.9286,0.7917,1.0,0.9231,0.96,0.6316,0.6794
3,0.7143,0.5,0.8333,0.8333,0.8333,-0.1667,-0.1667
4,0.7857,0.9167,0.9167,0.8462,0.88,-0.1053,-0.1132
5,0.9286,0.9167,0.9167,1.0,0.9565,0.7586,0.7817
6,0.9286,0.7879,1.0,0.9167,0.9565,0.7586,0.7817
7,0.7857,0.9091,0.7273,1.0,0.8421,0.5333,0.603
8,0.9286,0.8182,1.0,0.9167,0.9565,0.7586,0.7817
9,0.7857,0.8182,1.0,0.7857,0.88,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits
Original model was better than the tuned model, hence it will be returned. NOTE: The display metrics are for the tuned model (not the original one).


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.8276,0.775,1.0,0.8276,0.9057,0.0,0.0
1,0.8621,0.8696,0.9565,0.88,0.9167,0.5207,0.5363
2,0.8571,0.913,1.0,0.8519,0.92,0.2911,0.4128
3,0.8571,0.7739,0.913,0.913,0.913,0.513,0.513
4,0.8571,0.8,1.0,0.8519,0.92,0.2911,0.4128
Mean,0.8522,0.8263,0.9739,0.8649,0.9151,0.3232,0.375
Std,0.0125,0.0556,0.0348,0.0293,0.0054,0.1905,0.1942


Unnamed: 0,Description,Value
0,Session id,6194
1,Target,Closed_In_2Yrs
2,Target type,Binary
3,Original data shape,"(505, 14)"
4,Transformed data shape,"(505, 11)"
5,Transformed train set shape,"(353, 11)"
6,Transformed test set shape,"(152, 11)"
7,Numeric features,13
8,Preprocess,True
9,Imputation type,simple


Unnamed: 0,Model,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC,TT (Sec)
rf,Random Forest Classifier,0.7394,0.6091,0.9575,0.7535,0.8429,0.1331,0.1827,0.056
lightgbm,Light Gradient Boosting Machine,0.7225,0.5829,0.9028,0.7622,0.8257,0.156,0.1738,0.008
et,Extra Trees Classifier,0.7339,0.5815,0.9458,0.7537,0.8384,0.1294,0.1654,0.044
gbc,Gradient Boosting Classifier,0.731,0.5741,0.93,0.7583,0.8346,0.1445,0.1703,0.021
knn,K Neighbors Classifier,0.6748,0.5674,0.8571,0.7401,0.7933,0.0368,0.0304,0.011
dt,Decision Tree Classifier,0.6602,0.5666,0.7711,0.7679,0.7669,0.1278,0.1325,0.005
lda,Linear Discriminant Analysis,0.7225,0.5563,0.9885,0.7286,0.8387,-0.0156,-0.0251,0.005
ada,Ada Boost Classifier,0.6915,0.5532,0.8875,0.7418,0.8075,0.052,0.0512,0.014
nb,Naive Bayes,0.4075,0.533,0.2934,0.7889,0.3327,0.0,0.0177,0.005
lr,Logistic Regression,0.7254,0.528,0.9923,0.7293,0.8406,-0.0102,-0.015,0.022


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.7222,0.4654,0.9615,0.7353,0.8333,0.0816,0.1203
1,0.75,0.5192,1.0,0.7429,0.8525,0.1383,0.2726
2,0.7222,0.4327,0.9231,0.75,0.8276,0.1509,0.1754
3,0.7714,0.76,1.0,0.7576,0.8621,0.2632,0.3892
4,0.7143,0.57,0.92,0.7419,0.8214,0.1463,0.1704
5,0.7714,0.5256,1.0,0.7647,0.8667,0.1566,0.2915
6,0.7429,0.641,0.9615,0.7576,0.8475,0.0974,0.1368
7,0.7429,0.5342,0.9615,0.7576,0.8475,0.0974,0.1368
8,0.7143,0.5983,0.9231,0.75,0.8276,0.0437,0.0534
9,0.7714,0.641,0.9231,0.8,0.8571,0.3,0.3203


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.7222,0.5577,1.0,0.7222,0.8387,0.0,0.0
1,0.7222,0.6808,1.0,0.7222,0.8387,0.0,0.0
2,0.7222,0.5231,1.0,0.7222,0.8387,0.0,0.0
3,0.7143,0.646,1.0,0.7143,0.8333,0.0,0.0
4,0.7143,0.476,1.0,0.7143,0.8333,0.0,0.0
5,0.7429,0.4915,1.0,0.7429,0.8525,0.0,0.0
6,0.7429,0.6688,1.0,0.7429,0.8525,0.0,0.0
7,0.7429,0.4615,1.0,0.7429,0.8525,0.0,0.0
8,0.7429,0.4786,1.0,0.7429,0.8525,0.0,0.0
9,0.7429,0.5321,1.0,0.7429,0.8525,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.7222,0.5808,1.0,0.7222,0.8387,0.0,0.0
1,0.7222,0.5269,1.0,0.7222,0.8387,0.0,0.0
2,0.7222,0.5558,1.0,0.7222,0.8387,0.0,0.0
3,0.7143,0.624,1.0,0.7143,0.8333,0.0,0.0
4,0.7143,0.49,1.0,0.7143,0.8333,0.0,0.0
5,0.7429,0.6838,1.0,0.7429,0.8525,0.0,0.0
6,0.7429,0.4658,1.0,0.7429,0.8525,0.0,0.0
7,0.7429,0.3803,1.0,0.7429,0.8525,0.0,0.0
8,0.7429,0.688,1.0,0.7429,0.8525,0.0,0.0
9,0.7429,0.4744,1.0,0.7429,0.8525,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits
Original model was better than the tuned model, hence it will be returned. NOTE: The display metrics are for the tuned model (not the original one).


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.7324,0.5344,1.0,0.7324,0.8455,0.0,0.0
1,0.7042,0.5435,0.9423,0.7313,0.8235,-0.0068,-0.0097
2,0.7606,0.5607,1.0,0.7536,0.8595,0.147,0.2817
3,0.7571,0.4716,1.0,0.75,0.8571,0.1463,0.281
4,0.7571,0.7007,1.0,0.75,0.8571,0.1463,0.281
Mean,0.7423,0.5622,0.9885,0.7435,0.8486,0.0866,0.1668
Std,0.0215,0.0755,0.0231,0.0096,0.0134,0.0735,0.1402




Unnamed: 0,Description,Value
0,Session id,443
1,Target,Closed_In_2Yrs
2,Target type,Binary
3,Original data shape,"(65, 14)"
4,Transformed data shape,"(65, 11)"
5,Transformed train set shape,"(45, 11)"
6,Transformed test set shape,"(20, 11)"
7,Numeric features,13
8,Preprocess,True
9,Imputation type,simple


Unnamed: 0,Model,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC,TT (Sec)
gbc,Gradient Boosting Classifier,0.845,0.9375,0.9083,0.9,0.8943,0.5682,0.5781,0.009
rf,Random Forest Classifier,0.875,0.9,0.975,0.885,0.9214,0.6295,0.6362,0.042
et,Extra Trees Classifier,0.855,0.9,0.9417,0.8767,0.9024,0.5917,0.5917,0.036
ada,Ada Boost Classifier,0.83,0.8583,0.875,0.9,0.8779,0.5502,0.5586,0.011
lightgbm,Light Gradient Boosting Machine,0.785,0.8583,1.0,0.785,0.8738,0.2,0.2,0.005
dt,Decision Tree Classifier,0.775,0.7583,0.8167,0.8917,0.8362,0.4589,0.4821,0.005
knn,K Neighbors Classifier,0.785,0.6833,0.9083,0.8367,0.8566,0.3212,0.3356,0.01
lda,Linear Discriminant Analysis,0.705,0.6167,0.7417,0.7633,0.7329,0.3329,0.3529,0.005
lr,Logistic Regression,0.76,0.5417,0.9667,0.7667,0.8512,0.1167,0.1167,0.023
nb,Naive Bayes,0.5,0.5,0.4417,0.6133,0.4879,0.0765,0.0765,0.005


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.8,0.8333,1.0,0.75,0.8571,0.5455,0.6124
1,1.0,1.0,1.0,1.0,1.0,1.0,1.0
2,0.8,1.0,1.0,0.8,0.8889,0.0,0.0
3,1.0,1.0,1.0,1.0,1.0,1.0,1.0
4,1.0,1.0,1.0,1.0,1.0,1.0,1.0
5,0.75,1.0,1.0,0.75,0.8571,0.0,0.0
6,1.0,1.0,1.0,1.0,1.0,1.0,1.0
7,1.0,1.0,1.0,1.0,1.0,1.0,1.0
8,1.0,1.0,1.0,1.0,1.0,1.0,1.0
9,1.0,1.0,1.0,1.0,1.0,1.0,1.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.8,1.0,1.0,0.75,0.8571,0.5455,0.6124
1,0.8,0.8333,1.0,0.75,0.8571,0.5455,0.6124
2,0.6,0.5,0.75,0.75,0.75,-0.25,-0.25
3,1.0,1.0,1.0,1.0,1.0,1.0,1.0
4,1.0,1.0,1.0,1.0,1.0,1.0,1.0
5,0.75,0.6667,1.0,0.75,0.8571,0.0,0.0
6,1.0,1.0,1.0,1.0,1.0,1.0,1.0
7,1.0,1.0,1.0,1.0,1.0,1.0,1.0
8,1.0,1.0,1.0,1.0,1.0,1.0,1.0
9,1.0,1.0,1.0,1.0,1.0,1.0,1.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.6,0.3333,1.0,0.6,0.75,0.0,0.0
1,0.6,0.8333,0.6667,0.6667,0.6667,0.1667,0.1667
2,0.8,0.25,1.0,0.8,0.8889,0.0,0.0
3,1.0,1.0,1.0,1.0,1.0,1.0,1.0
4,0.8,1.0,1.0,0.8,0.8889,0.0,0.0
5,0.75,0.3333,1.0,0.75,0.8571,0.0,0.0
6,0.75,1.0,1.0,0.75,0.8571,0.0,0.0
7,1.0,1.0,1.0,1.0,1.0,1.0,1.0
8,1.0,1.0,1.0,1.0,1.0,1.0,1.0
9,1.0,1.0,1.0,1.0,1.0,1.0,1.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits
Original model was better than the tuned model, hence it will be returned. NOTE: The display metrics are for the tuned model (not the original one).


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.5556,0.7222,0.8333,0.625,0.7143,-0.2,-0.25
1,0.8889,0.8889,1.0,0.8571,0.9231,0.7273,0.7559
2,0.8889,0.9286,1.0,0.875,0.9333,0.6087,0.6614
3,1.0,1.0,1.0,1.0,1.0,1.0,1.0
4,1.0,1.0,1.0,1.0,1.0,1.0,1.0
Mean,0.8667,0.9079,0.9667,0.8714,0.9141,0.6272,0.6335
Std,0.1633,0.1022,0.0667,0.1371,0.105,0.441,0.4615


Unnamed: 0,Description,Value
0,Session id,5557
1,Target,Closed_In_2Yrs
2,Target type,Binary
3,Original data shape,"(294, 22)"
4,Transformed data shape,"(294, 11)"
5,Transformed train set shape,"(205, 11)"
6,Transformed test set shape,"(89, 11)"
7,Numeric features,21
8,Preprocess,True
9,Imputation type,simple


Unnamed: 0,Model,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC,TT (Sec)
et,Extra Trees Classifier,0.7462,0.7212,0.8986,0.7871,0.8361,0.2603,0.2751,0.044
nb,Naive Bayes,0.6967,0.689,0.8114,0.7791,0.7855,0.2311,0.2568,0.005
rf,Random Forest Classifier,0.7514,0.6717,0.9452,0.7682,0.8458,0.2144,0.2604,0.056
lr,Logistic Regression,0.7117,0.6702,0.8257,0.7914,0.8032,0.2564,0.277,0.04
qda,Quadratic Discriminant Analysis,0.4838,0.6651,0.3362,0.8804,0.4781,0.1404,0.2102,0.006
lda,Linear Discriminant Analysis,0.7562,0.665,0.9124,0.7883,0.8438,0.2897,0.3255,0.005
gbc,Gradient Boosting Classifier,0.7371,0.6576,0.879,0.7853,0.8282,0.257,0.2765,0.015
lightgbm,Light Gradient Boosting Machine,0.6931,0.6521,0.8319,0.7676,0.7959,0.1575,0.1663,0.006
knn,K Neighbors Classifier,0.7314,0.6377,0.899,0.7719,0.8288,0.2103,0.2395,0.015
ada,Ada Boost Classifier,0.6402,0.6105,0.7776,0.7388,0.7537,0.0534,0.059,0.014


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.7143,0.5,1.0,0.7143,0.8333,0.0,0.0
1,0.7143,0.5,1.0,0.7143,0.8333,0.0,0.0
2,0.7143,0.5,1.0,0.7143,0.8333,0.0,0.0
3,0.7143,0.5,1.0,0.7143,0.8333,0.0,0.0
4,0.7143,0.5,1.0,0.7143,0.8333,0.0,0.0
5,0.75,0.5,1.0,0.75,0.8571,0.0,0.0
6,0.75,0.5,1.0,0.75,0.8571,0.0,0.0
7,0.75,0.5,1.0,0.75,0.8571,0.0,0.0
8,0.75,0.5,1.0,0.75,0.8571,0.0,0.0
9,0.7,0.5,1.0,0.7,0.8235,0.0,0.0


Fitting 10 folds for each of 10 candidates, totalling 100 fits
Original model was better than the tuned model, hence it will be returned. NOTE: The display metrics are for the tuned model (not the original one).


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.6667,0.7,0.8,0.75,0.7742,0.1404,0.1414
1,0.7143,0.6111,0.8667,0.7647,0.8125,0.2222,0.2301
2,0.7143,0.6167,0.8,0.8,0.8,0.3,0.3
3,0.8095,0.7333,1.0,0.7895,0.8824,0.4167,0.513
4,0.8095,0.7667,1.0,0.7895,0.8824,0.4167,0.513
5,0.75,0.6267,0.9333,0.7778,0.8485,0.1667,0.1925
6,0.7,0.8,0.7333,0.8462,0.7857,0.2941,0.3026
7,0.8,0.6533,0.9333,0.8235,0.875,0.3846,0.4042
8,0.85,0.6533,0.9333,0.875,0.9032,0.5714,0.5774
9,0.6,0.7024,0.7143,0.7143,0.7143,0.0476,0.0476


Fitting 10 folds for each of 10 candidates, totalling 100 fits


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.8571,0.8556,0.8667,0.9286,0.8966,0.6667,0.6708
1,0.5714,0.6667,0.6,0.75,0.6667,0.087,0.0913
2,0.6667,0.7111,0.6667,0.8333,0.7407,0.2899,0.3043
3,0.8095,0.8222,0.8667,0.8667,0.8667,0.5333,0.5333
4,0.7619,0.6667,0.8667,0.8125,0.8387,0.386,0.3889
5,0.9,0.8,0.9333,0.9333,0.9333,0.7333,0.7333
6,0.7,0.6267,0.7333,0.8462,0.7857,0.2941,0.3026
7,0.6,0.52,0.7333,0.7333,0.7333,-0.0667,-0.0667
8,0.75,0.68,0.8667,0.8125,0.8387,0.2857,0.2887
9,0.7,0.7024,0.7857,0.7857,0.7857,0.2857,0.2857


Fitting 10 folds for each of 10 candidates, totalling 100 fits
Original model was better than the tuned model, hence it will be returned. NOTE: The display metrics are for the tuned model (not the original one).


Unnamed: 0_level_0,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC
Fold,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
0,0.7561,0.7061,0.9,0.7941,0.8438,0.2979,0.3104
1,0.7805,0.7333,0.8667,0.8387,0.8525,0.4243,0.4252
2,0.7561,0.8424,0.9667,0.7632,0.8529,0.1929,0.2526
3,0.7073,0.6455,0.8667,0.7647,0.8125,0.1575,0.1641
4,0.7805,0.7356,0.8621,0.8333,0.8475,0.4566,0.4574
Mean,0.7561,0.7326,0.8924,0.7988,0.8418,0.3059,0.322
Std,0.0267,0.0638,0.0395,0.0324,0.015,0.1196,0.1085



100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 2/2 [03:17<00:00, 98.57s/it][A
100%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 2/2 [06:29<00:00, 194.69s/it]


In [14]:
aggregated_result_path = EXP_RESULT_PATH / 'result.csv'

if not os.path.exists(aggregated_result_path) :
    exp_result.to_csv(aggregated_result_path)
    
exp_result

Unnamed: 0,Fold,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC,target,x_data_yaer,대분류,feature_selection
0,0,0.8294,0.5741,0.1212,0.2222,0.1569,0.0710,0.0750,Closed_In_1Yr,2018,제조업(10~34),"['순운전자본/자산총계', '매출채권', '비유동자산', '유형자산', '자본금',..."
1,1,0.8810,0.6657,0.1515,0.7143,0.2500,0.2140,0.2923,Closed_In_1Yr,2018,제조업(10~34),"['순운전자본/자산총계', '매출채권', '비유동자산', '유형자산', '자본금',..."
2,2,0.8889,0.7109,0.1515,1.0000,0.2632,0.2369,0.3665,Closed_In_1Yr,2018,제조업(10~34),"['순운전자본/자산총계', '매출채권', '비유동자산', '유형자산', '자본금',..."
3,3,0.8849,0.6781,0.1515,0.8333,0.2564,0.2252,0.3252,Closed_In_1Yr,2018,제조업(10~34),"['순운전자본/자산총계', '매출채권', '비유동자산', '유형자산', '자본금',..."
4,4,0.8645,0.6511,0.0625,0.3333,0.1053,0.0677,0.0966,Closed_In_1Yr,2018,제조업(10~34),"['순운전자본/자산총계', '매출채권', '비유동자산', '유형자산', '자본금',..."
...,...,...,...,...,...,...,...,...,...,...,...,...
2,2,0.7561,0.8424,0.9667,0.7632,0.8529,0.1929,0.2526,Closed_In_2Yrs,2019,건설업(41~42),"['매출채권', '비유동자산', '유형자산', '판매비와관리비', '기업순이익률(%..."
3,3,0.7073,0.6455,0.8667,0.7647,0.8125,0.1575,0.1641,Closed_In_2Yrs,2019,건설업(41~42),"['매출채권', '비유동자산', '유형자산', '판매비와관리비', '기업순이익률(%..."
4,4,0.7805,0.7356,0.8621,0.8333,0.8475,0.4566,0.4574,Closed_In_2Yrs,2019,건설업(41~42),"['매출채권', '비유동자산', '유형자산', '판매비와관리비', '기업순이익률(%..."
5,Mean,0.7561,0.7326,0.8924,0.7988,0.8418,0.3059,0.3220,Closed_In_2Yrs,2019,건설업(41~42),"['매출채권', '비유동자산', '유형자산', '판매비와관리비', '기업순이익률(%..."
