In [None]:
#numpy and pandas for data manipulation
import numpy as np
import pandas as pd

from sklearn.model_selection import KFold

from sklearn.model_selection import StratifiedKFold

from sklearn.ensemble import RandomForestClassifier

from sklearn.model_selection import cross_val_predict

from sklearn.preprocessing import StandardScaler
from sklearn.impute import SimpleImputer

from sklearn.model_selection import train_test_split
from sklearn import metrics

#sklearn preprocessing for dealing with categorical variables
from sklearn.preprocessing import LabelEncoder

from itertools import product


samples = pd.read_csv('preprocessed-75.csv')

# Create a label encoder object
le = LabelEncoder()
le_count = 0

# Iterate through the columns
for col in samples:
    if samples[col].dtype == 'bool':
        # If 2 or fewer unique categories
        if len(list(samples[col].unique())) <= 2:
            # Train on the training data
            le.fit(samples[col])
            # Transform 
            samples[col] = le.transform(samples[col])
            
            # Keep track of how many columns were label encoded
            le_count += 1
print('%d columns were label encoded.' % le_count)


train_label = samples['TARGET']
print(train_label)



# one-hot encoding of categorical variables
samples = pd.get_dummies(samples)
correlations = samples.corr()['TARGET'].abs().sort_values(ascending=False)
samples = samples.drop(columns = [250:].index.values.tolist())


In [None]:
train_label = samples['TARGET']
samples = samples.drop(columns=['TARGET'])
# Median imputation of missing values
imputer = SimpleImputer(strategy = 'median')

# Scale each feature to -1 and 1
scaler = StandardScaler()

# Fit on the training data
imputer.fit(samples)

# Transform both training and testing data
samples = imputer.transform(samples)

# Repeat with the scaler
scaler.fit(samples)
samples = scaler.transform(samples)

print('Training data shape: ', samples.shape)

In [42]:
x_train,x_test, y_train, y_test = train_test_split(samples, train_label, test_size=0.2)

In [46]:
tot_trees = [100, 200, 300, 400]
for tot_tree in tot_trees:
    kf = StratifiedKFold(n_splits=5, random_state=None, shuffle=False)
    random_forest = RandomForestClassifier(n_estimators = tot_tree, class_weight='balanced', random_state = 50, verbose = 1, n_jobs = -1)
    y_pred = cross_val_predict(estimator=random_forest, X=x_train, y=y_train, cv=kf)
    print("Number of trees - {}  roc - {}".format(tot_tree,metrics.roc_auc_score(y_train, y_pred)))

[Parallel(n_jobs=-1)]: Using backend LokyBackend with 8 concurrent workers.
[Parallel(n_jobs=-1)]: Done  34 tasks      | elapsed:   52.3s
[Parallel(n_jobs=-1)]: Done 100 out of 100 | elapsed:  1.8min finished
[Parallel(n_jobs=8)]: Using backend ThreadingBackend with 8 concurrent workers.
[Parallel(n_jobs=8)]: Done  34 tasks      | elapsed:    0.3s
[Parallel(n_jobs=8)]: Done 100 out of 100 | elapsed:    0.7s finished
[Parallel(n_jobs=-1)]: Using backend LokyBackend with 8 concurrent workers.
[Parallel(n_jobs=-1)]: Done  34 tasks      | elapsed:   41.9s
[Parallel(n_jobs=-1)]: Done 100 out of 100 | elapsed:  1.6min finished
[Parallel(n_jobs=8)]: Using backend ThreadingBackend with 8 concurrent workers.
[Parallel(n_jobs=8)]: Done  34 tasks      | elapsed:    0.2s
[Parallel(n_jobs=8)]: Done 100 out of 100 | elapsed:    0.6s finished
[Parallel(n_jobs=-1)]: Using backend LokyBackend with 8 concurrent workers.
[Parallel(n_jobs=-1)]: Done  34 tasks      | elapsed:   43.4s
[Parallel(n_jobs=-1)]:

Number of trees - 100  roc - 0.5009077843126325


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 8 concurrent workers.
[Parallel(n_jobs=-1)]: Done  34 tasks      | elapsed:   39.3s
[Parallel(n_jobs=-1)]: Done 184 tasks      | elapsed:  2.9min
[Parallel(n_jobs=-1)]: Done 200 out of 200 | elapsed:  3.1min finished
[Parallel(n_jobs=8)]: Using backend ThreadingBackend with 8 concurrent workers.
[Parallel(n_jobs=8)]: Done  34 tasks      | elapsed:    0.2s
[Parallel(n_jobs=8)]: Done 184 tasks      | elapsed:    1.2s
[Parallel(n_jobs=8)]: Done 200 out of 200 | elapsed:    1.3s finished
[Parallel(n_jobs=-1)]: Using backend LokyBackend with 8 concurrent workers.
[Parallel(n_jobs=-1)]: Done  34 tasks      | elapsed:   39.4s
[Parallel(n_jobs=-1)]: Done 184 tasks      | elapsed:  2.7min
[Parallel(n_jobs=-1)]: Done 200 out of 200 | elapsed:  2.9min finished
[Parallel(n_jobs=8)]: Using backend ThreadingBackend with 8 concurrent workers.
[Parallel(n_jobs=8)]: Done  34 tasks      | elapsed:    0.2s
[Parallel(n_jobs=8)]: Done 184 tasks      | e

Number of trees - 200  roc - 0.5006807409221178


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 8 concurrent workers.
[Parallel(n_jobs=-1)]: Done  34 tasks      | elapsed:   37.1s
[Parallel(n_jobs=-1)]: Done 184 tasks      | elapsed:  2.6min
[Parallel(n_jobs=-1)]: Done 300 out of 300 | elapsed:  4.2min finished
[Parallel(n_jobs=8)]: Using backend ThreadingBackend with 8 concurrent workers.
[Parallel(n_jobs=8)]: Done  34 tasks      | elapsed:    0.2s
[Parallel(n_jobs=8)]: Done 184 tasks      | elapsed:    1.1s
[Parallel(n_jobs=8)]: Done 300 out of 300 | elapsed:    1.8s finished
[Parallel(n_jobs=-1)]: Using backend LokyBackend with 8 concurrent workers.
[Parallel(n_jobs=-1)]: Done  34 tasks      | elapsed:   40.9s
[Parallel(n_jobs=-1)]: Done 184 tasks      | elapsed:  2.7min
[Parallel(n_jobs=-1)]: Done 300 out of 300 | elapsed:  4.5min finished
[Parallel(n_jobs=8)]: Using backend ThreadingBackend with 8 concurrent workers.
[Parallel(n_jobs=8)]: Done  34 tasks      | elapsed:    0.3s
[Parallel(n_jobs=8)]: Done 184 tasks      | e

KeyboardInterrupt: 

In [47]:
train_label.value_counts()

0    282682
1     24825
Name: TARGET, dtype: int64

In [53]:
print(correlations.head(200))

EXT_SOURCE_3                                            -0.178926
EXT_SOURCE_2                                            -0.160471
EXT_SOURCE_1                                            -0.155317
previous_NAME_CONTRACT_STATUS_Approved_mean             -0.063526
client_bureau_balance_STATUS_C_sum_mean                 -0.062954
                                                           ...   
client_credit_AMT_CREDIT_LIMIT_ACTUAL_mean_min          -0.009037
previous_NAME_SELLER_INDUSTRY_Industry_mean             -0.008887
client_cash_NAME_CONTRACT_STATUS_Active_sum_mean        -0.008667
previous_CHANNEL_TYPE_Channel of corporate sales_mean   -0.008606
previous_NAME_GOODS_CATEGORY_Medical Supplies_sum       -0.008592
Name: TARGET, Length: 200, dtype: float64


In [70]:
for val in correlations.abs().sort_values(ascending=False).index.values.tolist():
    print("{} : {}".format(val,correlations[val]))

TARGET : 1.0
EXT_SOURCE_3 : -0.17892627558435192
EXT_SOURCE_2 : -0.16047133450758758
EXT_SOURCE_1 : -0.15531709815567368
client_credit_CNT_DRAWINGS_CURRENT_max_min : 0.10064765816882223
bureau_DAYS_CREDIT_mean : 0.08973059094733742
client_credit_CNT_DRAWINGS_CURRENT_mean_mean : 0.08252014479100929
DAYS_BIRTH : 0.07824216003637195
previous_NAME_CONTRACT_STATUS_Refused_mean : 0.07768083802616721
bureau_CREDIT_ACTIVE_Active_mean : 0.07735592009728258
bureau_DAYS_CREDIT_min : 0.07524766201015329
DAYS_EMPLOYED : 0.07495658541678334
client_credit_AMT_INST_MIN_REGULARITY_mean_min : 0.073593888083776
bureau_DAYS_CREDIT_UPDATE_mean : 0.06892893766081801
client_bureau_balance_MONTHS_BALANCE_sum_min : 0.06807162991863505
bureau_CREDIT_ACTIVE_Active_sum : 0.06713227480456399
previous_NAME_CONTRACT_STATUS_Refused_sum : 0.06448718697572972
client_credit_AMT_RECIVABLE_min_min : 0.06360992390964873
previous_NAME_CONTRACT_STATUS_Approved_mean : -0.06352569361342807
client_bureau_balance_STATUS_C_sum_me

In [71]:
sorted_corr = correlations.abs().sort_values(ascending=False)

In [91]:
sorted_corr[250:].index.values.tolist()

['TARGET',
 'EXT_SOURCE_3',
 'EXT_SOURCE_2',
 'EXT_SOURCE_1',
 'client_credit_CNT_DRAWINGS_CURRENT_max_min',
 'bureau_DAYS_CREDIT_mean',
 'client_credit_CNT_DRAWINGS_CURRENT_mean_mean',
 'DAYS_BIRTH',
 'previous_NAME_CONTRACT_STATUS_Refused_mean',
 'bureau_CREDIT_ACTIVE_Active_mean',
 'bureau_DAYS_CREDIT_min',
 'DAYS_EMPLOYED',
 'client_credit_AMT_INST_MIN_REGULARITY_mean_min',
 'bureau_DAYS_CREDIT_UPDATE_mean',
 'client_bureau_balance_MONTHS_BALANCE_sum_min',
 'bureau_CREDIT_ACTIVE_Active_sum',
 'previous_NAME_CONTRACT_STATUS_Refused_sum',
 'client_credit_AMT_RECIVABLE_min_min',
 'previous_NAME_CONTRACT_STATUS_Approved_mean',
 'client_bureau_balance_STATUS_C_sum_mean',
 'client_credit_AMT_INST_MIN_REGULARITY_max_min',
 'previous_NAME_PRODUCT_TYPE_walk-in_sum',
 'client_bureau_balance_STATUS_1_mean_mean',
 'client_bureau_balance_STATUS_1_mean_max',
 'client_bureau_balance_STATUS_C_sum_max',
 'REGION_RATING_CLIENT',
 'client_credit_AMT_DRAWINGS_CURRENT_mean_min',
 'client_installments_A

In [93]:
df = pd.read_csv('preprocessed-75.csv').drop(columns=[sorted_corr[250:].index.values.tolist()])

KeyError: "[('OCCUPATION_TYPE_Core staff', 'client_credit_NAME_CONTRACT_STATUS_Completed_mean_sum', 'client_bureau_balance_MONTHS_BALANCE_max_min', 'bureau_CREDIT_TYPE_Car loan_mean', 'client_credit_AMT_CREDIT_LIMIT_ACTUAL_min_sum', 'bureau_AMT_CREDIT_SUM_mean', 'client_cash_NAME_CONTRACT_STATUS_Active_sum_sum', 'AMT_REQ_CREDIT_BUREAU_YEAR', 'client_cash_CNT_INSTALMENT_min_min', 'ORGANIZATION_TYPE_Construction', 'NAME_HOUSING_TYPE_Rented apartment', 'previous_NAME_SELLER_INDUSTRY_Clothing_sum', 'bureau_AMT_CREDIT_SUM_max', 'previous_DAYS_DECISION_sum', 'bureau_DAYS_ENDDATE_FACT_max', 'client_cash_NAME_CONTRACT_STATUS_Completed_mean_sum', 'OCCUPATION_TYPE_Sales staff', 'client_cash_NAME_CONTRACT_STATUS_Completed_mean_max', 'previous_AMT_CREDIT_min', 'client_cash_NAME_CONTRACT_STATUS_Completed_mean_min', 'NAME_FAMILY_STATUS_Widow', 'client_credit_AMT_PAYMENT_CURRENT_min_sum', 'previous_NAME_GOODS_CATEGORY_Consumer Electronics_mean', 'client_credit_CNT_DRAWINGS_ATM_CURRENT_min_sum', 'client_bureau_balance_STATUS_0_sum_sum', 'CNT_CHILDREN', 'ENTRANCES_AVG', 'previous_NAME_CASH_LOAN_PURPOSE_Other_mean', 'previous_NAME_CASH_LOAN_PURPOSE_Urgent needs_mean', 'previous_DAYS_FIRST_DUE_max', 'client_cash_CNT_INSTALMENT_FUTURE_min_min', 'client_bureau_balance_STATUS_5_mean_mean', 'client_bureau_balance_STATUS_5_mean_min', 'previous_CHANNEL_TYPE_Credit and cash offices_sum', 'previous_NAME_SELLER_INDUSTRY_Consumer electronics_sum', 'OCCUPATION_TYPE_Managers', 'previous_PRODUCT_COMBINATION_Cash_mean', 'client_bureau_balance_STATUS_2_mean_mean', 'COMMONAREA_AVG', 'client_cash_CNT_INSTALMENT_FUTURE_min_mean', 'previous_PRODUCT_COMBINATION_Cash Street: middle_mean', 'previous_CHANNEL_TYPE_Stone_sum', 'previous_NAME_GOODS_CATEGORY_Mobile_mean', 'previous_NAME_PRODUCT_TYPE_x-sell_mean', 'client_cash_CNT_INSTALMENT_FUTURE_mean_max', 'previous_PRODUCT_COMBINATION_Card X-Sell_sum', 'client_bureau_balance_STATUS_2_mean_max', 'client_cash_MONTHS_BALANCE_sum_sum', 'ORGANIZATION_TYPE_Transport: type 3', 'client_bureau_balance_STATUS_0_sum_min', 'client_bureau_balance_STATUS_3_mean_mean', 'client_installments_AMT_PAYMENT_sum_sum', 'client_bureau_balance_STATUS_3_sum_mean', 'previous_NAME_TYPE_SUITE_Children_sum', 'client_cash_NAME_CONTRACT_STATUS_Active_sum_min', 'previous_AMT_DOWN_PAYMENT_min', 'client_bureau_balance_STATUS_3_mean_max', 'bureau_CREDIT_ACTIVE_Sold_mean', 'client_installments_NUM_INSTALMENT_VERSION_sum_max', 'client_bureau_balance_STATUS_4_mean_max', 'client_credit_AMT_DRAWINGS_POS_CURRENT_sum_sum', 'previous_DAYS_DECISION_max', 'previous_NAME_TYPE_SUITE_Children_mean', 'client_bureau_balance_STATUS_4_sum_mean', 'client_bureau_balance_STATUS_4_mean_mean', 'previous_AMT_CREDIT_mean', 'previous_NAME_CASH_LOAN_PURPOSE_Payments on other loans_sum', 'previous_NAME_YIELD_GROUP_middle_mean', 'client_installments_NUM_INSTALMENT_NUMBER_mean_min', 'previous_NAME_TYPE_SUITE_Family_sum', 'client_bureau_balance_STATUS_4_mean_sum', 'client_bureau_balance_STATUS_3_mean_sum', 'previous_NAME_PORTFOLIO_Cash_sum', 'previous_PRODUCT_COMBINATION_Cash X-Sell: middle_mean', 'previous_NFLAG_INSURED_ON_APPROVAL_sum', 'client_installments_NUM_INSTALMENT_VERSION_sum_sum', 'client_bureau_balance_STATUS_4_sum_sum', 'bureau_AMT_ANNUITY_count', 'previous_NAME_SELLER_INDUSTRY_Construction_mean', 'client_credit_AMT_DRAWINGS_CURRENT_sum_sum', 'client_bureau_balance_STATUS_5_sum_min', 'client_bureau_balance_STATUS_4_sum_max', 'client_cash_NAME_CONTRACT_STATUS_Signed_mean_min', 'previous_WEEKDAY_APPR_PROCESS_START_THURSDAY_sum', 'previous_NAME_CASH_LOAN_PURPOSE_Car repairs_sum', 'previous_RATE_DOWN_PAYMENT_min', 'previous_CODE_REJECT_REASON_SCO_sum', 'OCCUPATION_TYPE_Security staff', 'client_bureau_balance_STATUS_X_sum_min', 'client_installments_AMT_PAYMENT_min_max', 'client_credit_CNT_DRAWINGS_CURRENT_min_sum', 'previous_WEEKDAY_APPR_PROCESS_START_MONDAY_sum', 'ANNUITY_INCOME_PERCENT', 'previous_PRODUCT_COMBINATION_POS mobile with interest_sum', 'client_cash_NAME_CONTRACT_STATUS_Signed_sum_min', 'previous_NAME_SELLER_INDUSTRY_Construction_sum', 'client_bureau_balance_STATUS_3_sum_sum', 'previous_NAME_CLIENT_TYPE_Refreshed_sum', 'bureau_AMT_CREDIT_SUM_sum', 'client_bureau_balance_STATUS_2_sum_sum', 'client_bureau_balance_STATUS_5_mean_sum', 'OCCUPATION_TYPE_High skill tech staff', 'client_bureau_balance_STATUS_5_mean_max', 'client_bureau_balance_STATUS_3_sum_max', 'ORGANIZATION_TYPE_School', 'client_installments_NUM_INSTALMENT_VERSION_sum_mean', 'client_installments_NUM_INSTALMENT_NUMBER_min_mean', 'NONLIVINGAREA_AVG', 'client_bureau_balance_STATUS_2_sum_mean', 'client_credit_CNT_DRAWINGS_POS_CURRENT_min_sum', 'client_installments_AMT_PAYMENT_mean_min', 'previous_NAME_CONTRACT_TYPE_XNA_sum', 'client_credit_AMT_DRAWINGS_POS_CURRENT_max_sum', 'previous_PRODUCT_COMBINATION_Cash Street: low_sum', 'client_cash_NAME_CONTRACT_STATUS_Completed_sum_min', 'AMT_ANNUITY', 'client_bureau_balance_MONTHS_BALANCE_max_sum', 'CREDIT_TERM', 'WALLSMATERIAL_MODE_Stone, brick', 'previous_WEEKDAY_APPR_PROCESS_START_TUESDAY_sum', 'previous_NAME_CASH_LOAN_PURPOSE_XNA_sum', 'client_credit_NAME_CONTRACT_STATUS_Sent proposal_mean_mean', 'previous_NAME_CASH_LOAN_PURPOSE_Building a house or an annex_sum', 'AMT_REQ_CREDIT_BUREAU_MON', 'client_cash_NAME_CONTRACT_STATUS_Returned to the store_sum_mean', 'previous_NAME_CASH_LOAN_PURPOSE_Payments on other loans_mean', 'previous_WEEKDAY_APPR_PROCESS_START_FRIDAY_sum', 'OCCUPATION_TYPE_Cooking staff', 'previous_NAME_CONTRACT_STATUS_Canceled_mean', 'previous_CODE_REJECT_REASON_SCO_mean', 'previous_CHANNEL_TYPE_Contact center_mean', 'client_cash_NAME_CONTRACT_STATUS_Active_mean_min', 'bureau_CREDIT_ACTIVE_Sold_sum', 'client_cash_NAME_CONTRACT_STATUS_Returned to the store_mean_mean', 'NAME_INCOME_TYPE_Commercial associate', 'client_credit_AMT_INST_MIN_REGULARITY_max_sum', 'previous_PRODUCT_COMBINATION_POS household with interest_sum', 'client_credit_AMT_DRAWINGS_ATM_CURRENT_max_sum', 'NAME_EDUCATION_TYPE_Lower secondary', 'previous_NFLAG_INSURED_ON_APPROVAL_min', 'FLAG_DOCUMENT_16', 'previous_NAME_CASH_LOAN_PURPOSE_Car repairs_mean', 'FLAG_DOCUMENT_13', 'previous_NAME_CASH_LOAN_PURPOSE_Medicine_sum', 'previous_NAME_TYPE_SUITE_Unaccompanied_mean', 'bureau_AMT_CREDIT_SUM_LIMIT_mean', 'previous_PRODUCT_COMBINATION_POS household with interest_mean', 'client_credit_CNT_DRAWINGS_POS_CURRENT_sum_sum', 'client_cash_NAME_CONTRACT_STATUS_Returned to the store_mean_max', 'FONDKAPREMONT_MODE_org spec account', 'FONDKAPREMONT_MODE_reg oper spec account', 'client_installments_NUM_INSTALMENT_VERSION_max_min', 'previous_WEEKDAY_APPR_PROCESS_START_WEDNESDAY_sum', 'previous_NAME_CASH_LOAN_PURPOSE_Buying a used car_sum', 'previous_NAME_GOODS_CATEGORY_Mobile_sum', 'client_credit_AMT_DRAWINGS_CURRENT_min_min', 'client_bureau_balance_STATUS_2_sum_max', 'LANDAREA_AVG', 'previous_CNT_PAYMENT_min', 'client_credit_AMT_DRAWINGS_ATM_CURRENT_min_sum', 'bureau_AMT_CREDIT_SUM_min', 'previous_DAYS_LAST_DUE_sum', 'previous_NFLAG_INSURED_ON_APPROVAL_max', 'previous_NAME_CASH_LOAN_PURPOSE_Building a house or an annex_mean', 'bureau_AMT_CREDIT_SUM_OVERDUE_max', 'ORGANIZATION_TYPE_Medicine', 'client_cash_NAME_CONTRACT_STATUS_Signed_mean_mean', 'client_bureau_balance_STATUS_3_sum_min', 'previous_CHANNEL_TYPE_Credit and cash offices_mean', 'ORGANIZATION_TYPE_Restaurant', 'previous_FLAG_LAST_APPL_PER_CONTRACT_N_sum', 'client_installments_AMT_PAYMENT_mean_max', 'client_bureau_balance_STATUS_5_sum_max', 'client_bureau_balance_STATUS_5_sum_sum', 'client_cash_NAME_CONTRACT_STATUS_Returned to the store_sum_min', 'previous_NAME_GOODS_CATEGORY_Construction Materials_mean', 'ORGANIZATION_TYPE_Military', 'previous_PRODUCT_COMBINATION_Card X-Sell_mean', 'previous_NAME_GOODS_CATEGORY_Construction Materials_sum', 'ORGANIZATION_TYPE_Police', 'previous_WEEKDAY_APPR_PROCESS_START_SUNDAY_mean', 'YEARS_BEGINEXPLUATATION_AVG', 'ORGANIZATION_TYPE_Industry: type 3', 'ORGANIZATION_TYPE_Bank', 'ORGANIZATION_TYPE_Security Ministries', 'FLAG_DOCUMENT_14', 'bureau_AMT_CREDIT_SUM_LIMIT_sum', 'WALLSMATERIAL_MODE_Monolithic', 'client_credit_AMT_DRAWINGS_ATM_CURRENT_sum_sum', 'CNT_FAM_MEMBERS', 'previous_CHANNEL_TYPE_Regional / Local_sum', 'previous_NAME_GOODS_CATEGORY_Medical Supplies_mean', 'previous_NAME_GOODS_CATEGORY_Audio/Video_sum', 'previous_NAME_CASH_LOAN_PURPOSE_Medicine_mean', 'client_bureau_balance_STATUS_4_sum_min', 'OBS_30_CNT_SOCIAL_CIRCLE', 'client_cash_NAME_CONTRACT_STATUS_Returned to the store_mean_sum', 'previous_CHANNEL_TYPE_Regional / Local_mean', 'client_credit_AMT_CREDIT_LIMIT_ACTUAL_mean_min', 'ORGANIZATION_TYPE_Trade: type 3', 'previous_NAME_SELLER_INDUSTRY_Industry_mean', 'client_cash_NAME_CONTRACT_STATUS_Returned to the store_mean_min', 'NAME_INCOME_TYPE_Unemployed', 'client_cash_CNT_INSTALMENT_FUTURE_min_max', 'previous_AMT_GOODS_PRICE_count', 'client_cash_NAME_CONTRACT_STATUS_Active_sum_mean', 'previous_NAME_CONTRACT_TYPE_XNA_mean', 'previous_CHANNEL_TYPE_Channel of corporate sales_mean', 'previous_NAME_GOODS_CATEGORY_Medical Supplies_sum', 'client_bureau_balance_STATUS_3_mean_min', 'previous_FLAG_LAST_APPL_PER_CONTRACT_N_mean', 'OCCUPATION_TYPE_Medicine staff', 'previous_WEEKDAY_APPR_PROCESS_START_SATURDAY_mean', 'previous_AMT_CREDIT_max', 'client_cash_NAME_CONTRACT_STATUS_Returned to the store_sum_sum', 'NAME_TYPE_SUITE_Unaccompanied', 'bureau_AMT_CREDIT_MAX_OVERDUE_count', 'NAME_TYPE_SUITE_Family', 'client_bureau_balance_STATUS_X_mean_sum', 'previous_NAME_CASH_LOAN_PURPOSE_Gasification / water supply_mean', 'ORGANIZATION_TYPE_Trade: type 7', 'bureau_CREDIT_DAY_OVERDUE_mean', 'previous_NAME_SELLER_INDUSTRY_Auto technology_sum', 'FLAG_DOCUMENT_8', 'client_cash_NAME_CONTRACT_STATUS_Active_mean_mean', 'client_credit_CNT_DRAWINGS_OTHER_CURRENT_max_sum', 'previous_NAME_CASH_LOAN_PURPOSE_Gasification / water supply_sum', 'FLAG_DOCUMENT_18', 'client_installments_AMT_PAYMENT_sum_min', 'WALLSMATERIAL_MODE_Wooden', 'client_credit_AMT_DRAWINGS_OTHER_CURRENT_sum_min', 'ORGANIZATION_TYPE_Agriculture', 'client_cash_NAME_CONTRACT_STATUS_Signed_sum_mean', 'OCCUPATION_TYPE_Waiters/barmen staff', 'CREDIT_INCOME_PERCENT', 'previous_NAME_GOODS_CATEGORY_Other_sum', 'ORGANIZATION_TYPE_University', 'previous_NAME_CASH_LOAN_PURPOSE_Purchase of electronic equipment_sum', 'bureau_CREDIT_DAY_OVERDUE_min', 'previous_NAME_CASH_LOAN_PURPOSE_Buying a used car_mean', 'ORGANIZATION_TYPE_Government', 'client_credit_CNT_DRAWINGS_ATM_CURRENT_max_sum', 'client_credit_AMT_PAYMENT_TOTAL_CURRENT_max_sum', 'previous_NAME_SELLER_INDUSTRY_Industry_sum', 'previous_NAME_GOODS_CATEGORY_Audio/Video_mean', 'ORGANIZATION_TYPE_Security', 'client_cash_NAME_CONTRACT_STATUS_Demand_mean_mean', 'previous_NAME_GOODS_CATEGORY_Tourism_sum', 'bureau_AMT_CREDIT_SUM_OVERDUE_mean', 'previous_DAYS_FIRST_DUE_sum', 'client_cash_SK_DPD_max_min', 'previous_NAME_PRODUCT_TYPE_XNA_sum', 'OCCUPATION_TYPE_Cleaning staff', 'client_cash_SK_DPD_mean_min', 'previous_CODE_REJECT_REASON_XNA_sum', 'REG_REGION_NOT_WORK_REGION', 'client_credit_CNT_DRAWINGS_ATM_CURRENT_sum_sum', 'previous_NAME_GOODS_CATEGORY_Tourism_mean', 'client_cash_CNT_INSTALMENT_FUTURE_min_sum', 'bureau_CREDIT_CURRENCY_currency 2_mean', 'WALLSMATERIAL_MODE_Block', 'previous_AMT_ANNUITY_sum', 'previous_DAYS_LAST_DUE_max', 'client_credit_SK_DPD_DEF_mean_mean', 'previous_NAME_CASH_LOAN_PURPOSE_Furniture_sum', 'FLAG_DOCUMENT_15', 'client_cash_SK_DPD_DEF_mean_mean', 'client_bureau_balance_STATUS_2_sum_min', 'client_credit_NAME_CONTRACT_STATUS_Signed_sum_min', 'previous_NAME_GOODS_CATEGORY_Homewares_mean', 'ORGANIZATION_TYPE_Industry: type 1', 'client_bureau_balance_STATUS_4_mean_min', 'client_cash_NAME_CONTRACT_STATUS_Amortized debt_mean_mean', 'previous_NAME_CASH_LOAN_PURPOSE_Everyday expenses_sum', 'FLAG_OWN_REALTY', 'previous_NAME_PORTFOLIO_Cash_mean', 'client_bureau_balance_STATUS_2_mean_min', 'previous_NAME_GOODS_CATEGORY_Homewares_sum', 'bureau_CREDIT_TYPE_Loan for working capital replenishment_sum', 'previous_NAME_GOODS_CATEGORY_Vehicles_sum', 'bureau_CREDIT_CURRENCY_currency 2_sum', 'ORGANIZATION_TYPE_Transport: type 4', 'client_cash_MONTHS_BALANCE_sum_max', 'client_cash_CNT_INSTALMENT_FUTURE_mean_sum', 'client_cash_NAME_CONTRACT_STATUS_Demand_mean_min', 'ORGANIZATION_TYPE_Trade: type 6', 'previous_WEEKDAY_APPR_PROCESS_START_MONDAY_mean', 'ORGANIZATION_TYPE_Kindergarten', 'previous_PRODUCT_COMBINATION_Cash X-Sell: middle_sum', 'previous_NAME_GOODS_CATEGORY_Medicine_mean', 'previous_NAME_SELLER_INDUSTRY_Auto technology_mean', 'REG_REGION_NOT_LIVE_REGION', 'client_cash_SK_DPD_DEF_min_mean', 'bureau_CREDIT_DAY_OVERDUE_max', 'client_cash_SK_DPD_min_min', 'ORGANIZATION_TYPE_Industry: type 12', 'client_cash_SK_DPD_mean_mean', 'previous_NAME_CASH_LOAN_PURPOSE_Wedding / gift / holiday_sum', 'FLAG_DOCUMENT_2', 'ORGANIZATION_TYPE_Industry: type 9', 'HOUSETYPE_MODE_specific housing', 'previous_NAME_TYPE_SUITE_Other_A_mean', 'NAME_EDUCATION_TYPE_Academic degree', 'previous_NAME_TYPE_SUITE_Spouse, partner_mean', 'WEEKDAY_APPR_PROCESS_START_MONDAY', 'client_bureau_balance_MONTHS_BALANCE_max_max', 'client_installments_AMT_INSTALMENT_max_mean', 'NAME_HOUSING_TYPE_Office apartment', 'previous_NAME_GOODS_CATEGORY_Photo / Cinema Equipment_sum', 'OCCUPATION_TYPE_Private service staff', 'client_cash_NAME_CONTRACT_STATUS_Amortized debt_mean_min', 'previous_NAME_CASH_LOAN_PURPOSE_Hobby_sum', 'NAME_TYPE_SUITE_Other_B', 'EMERGENCYSTATE_MODE_Yes', 'previous_WEEKDAY_APPR_PROCESS_START_FRIDAY_mean', 'bureau_AMT_CREDIT_SUM_LIMIT_min', 'previous_NAME_CASH_LOAN_PURPOSE_Business development_sum', 'previous_NAME_CASH_LOAN_PURPOSE_Buying a home_sum', 'previous_NAME_GOODS_CATEGORY_Other_mean', 'previous_NAME_CASH_LOAN_PURPOSE_Wedding / gift / holiday_mean', 'client_cash_NAME_CONTRACT_STATUS_Canceled_sum_sum', 'NAME_INCOME_TYPE_Maternity leave', 'client_cash_SK_DPD_DEF_min_min', 'WEEKDAY_APPR_PROCESS_START_TUESDAY', 'bureau_CREDIT_ACTIVE_Bad debt_mean', 'previous_NAME_CLIENT_TYPE_Repeater_mean', 'previous_NAME_SELLER_INDUSTRY_Tourism_mean', 'previous_NAME_GOODS_CATEGORY_Medicine_sum', 'bureau_CREDIT_TYPE_Loan for the purchase of equipment_sum', 'previous_DAYS_FIRST_DUE_mean', 'previous_NAME_CASH_LOAN_PURPOSE_Education_sum', 'previous_NAME_CASH_LOAN_PURPOSE_Buying a holiday home / land_mean', 'previous_NAME_YIELD_GROUP_middle_sum', 'previous_NAME_GOODS_CATEGORY_Computers_mean', 'previous_NAME_GOODS_CATEGORY_Photo / Cinema Equipment_mean', 'FLAG_DOCUMENT_9', 'client_credit_CNT_DRAWINGS_CURRENT_sum_sum', 'previous_NAME_GOODS_CATEGORY_Gardening_sum', 'previous_NAME_SELLER_INDUSTRY_Tourism_sum', 'previous_NAME_GOODS_CATEGORY_Gardening_mean', 'previous_NAME_CASH_LOAN_PURPOSE_Journey_sum', 'FLAG_DOCUMENT_11', 'previous_NAME_SELLER_INDUSTRY_MLM partners_mean', 'client_cash_NAME_CONTRACT_STATUS_Demand_sum_min', 'previous_CHANNEL_TYPE_Channel of corporate sales_sum', 'previous_NAME_CASH_LOAN_PURPOSE_XAP_sum', 'ORGANIZATION_TYPE_Industry: type 4', 'previous_WEEKDAY_APPR_PROCESS_START_WEDNESDAY_mean', 'previous_NAME_GOODS_CATEGORY_Auto Accessories_sum', 'bureau_CREDIT_ACTIVE_Bad debt_sum', 'previous_CODE_REJECT_REASON_XNA_mean', 'AMT_INCOME_TOTAL', 'bureau_CNT_CREDIT_PROLONG_max', 'previous_NAME_CASH_LOAN_PURPOSE_Hobby_mean', 'previous_PRODUCT_COMBINATION_POS other with interest_mean', 'client_installments_AMT_INSTALMENT_max_min', 'ORGANIZATION_TYPE_Services', 'client_installments_NUM_INSTALMENT_VERSION_min_max', 'ORGANIZATION_TYPE_Insurance', 'client_credit_AMT_DRAWINGS_POS_CURRENT_sum_min', 'ORGANIZATION_TYPE_Other', 'bureau_CREDIT_TYPE_Loan for business development_sum', 'FLAG_DOCUMENT_21', 'previous_NAME_GOODS_CATEGORY_Vehicles_mean', 'previous_NAME_CASH_LOAN_PURPOSE_Buying a holiday home / land_sum', 'client_cash_SK_DPD_DEF_mean_min', 'previous_NAME_GOODS_CATEGORY_Fitness_mean', 'client_credit_AMT_DRAWINGS_OTHER_CURRENT_sum_sum', 'previous_NAME_GOODS_CATEGORY_Jewelry_sum', 'previous_NAME_CASH_LOAN_PURPOSE_Education_mean', 'bureau_AMT_CREDIT_SUM_LIMIT_count', 'previous_WEEKDAY_APPR_PROCESS_START_SATURDAY_sum', 'ORGANIZATION_TYPE_Hotel', 'previous_NAME_CASH_LOAN_PURPOSE_Purchase of electronic equipment_mean', 'FLAG_DOCUMENT_17', 'ORGANIZATION_TYPE_Transport: type 1', 'client_cash_MONTHS_BALANCE_min_max', 'ORGANIZATION_TYPE_Realtor', 'NAME_HOUSING_TYPE_Municipal apartment', 'previous_CHANNEL_TYPE_Car dealer_sum', 'ORGANIZATION_TYPE_Cleaning', 'ORGANIZATION_TYPE_Culture', 'previous_WEEKDAY_APPR_PROCESS_START_THURSDAY_mean', 'client_credit_AMT_INST_MIN_REGULARITY_min_sum', 'client_credit_SK_DPD_mean_mean', 'previous_NAME_CLIENT_TYPE_XNA_sum', 'client_cash_SK_DPD_min_mean', 'client_credit_AMT_INST_MIN_REGULARITY_min_min', 'NONLIVINGAPARTMENTS_AVG', 'previous_NAME_CASH_LOAN_PURPOSE_Refusal to name the goal_sum', 'ORGANIZATION_TYPE_Business Entity Type 2', 'previous_CHANNEL_TYPE_Car dealer_mean', 'previous_SELLERPLACE_AREA_max', 'previous_NAME_GOODS_CATEGORY_Fitness_sum', 'ORGANIZATION_TYPE_Trade: type 2', 'previous_CODE_REJECT_REASON_VERIF_sum', 'bureau_CNT_CREDIT_PROLONG_mean', 'previous_NAME_GOODS_CATEGORY_Sport and Leisure_sum', 'previous_NAME_GOODS_CATEGORY_Auto Accessories_mean', 'previous_NAME_CASH_LOAN_PURPOSE_Money for a third person_sum', 'ORGANIZATION_TYPE_Electricity', 'bureau_CREDIT_CURRENCY_currency 3_sum', 'ORGANIZATION_TYPE_Industry: type 13', 'previous_NAME_GOODS_CATEGORY_Jewelry_mean', 'LIVE_REGION_NOT_WORK_REGION', 'NAME_EDUCATION_TYPE_Incomplete higher', 'previous_NAME_GOODS_CATEGORY_Insurance_mean', 'previous_NAME_SELLER_INDUSTRY_MLM partners_sum', 'bureau_CREDIT_CURRENCY_currency 3_mean', 'bureau_CREDIT_TYPE_Loan for business development_mean', 'client_installments_AMT_INSTALMENT_max_sum', 'previous_PRODUCT_COMBINATION_POS others without interest_sum', 'bureau_CREDIT_TYPE_Real estate loan_sum', 'AMT_REQ_CREDIT_BUREAU_DAY', 'previous_NAME_TYPE_SUITE_Other_A_sum', 'FLAG_DOCUMENT_4', 'FONDKAPREMONT_MODE_not specified', 'previous_PRODUCT_COMBINATION_POS mobile without interest_sum', 'NAME_TYPE_SUITE_Children', 'OCCUPATION_TYPE_HR staff', 'client_cash_NAME_CONTRACT_STATUS_Signed_sum_max', 'client_credit_AMT_INST_MIN_REGULARITY_sum_min', 'ORGANIZATION_TYPE_Trade: type 4', 'previous_WEEKDAY_APPR_PROCESS_START_SUNDAY_sum', 'previous_NAME_TYPE_SUITE_Unaccompanied_sum', 'previous_PRODUCT_COMBINATION_Cash Street: low_mean', 'previous_NAME_TYPE_SUITE_Other_B_mean', 'previous_PRODUCT_COMBINATION_POS mobile without interest_mean', 'bureau_AMT_ANNUITY_min', 'previous_NAME_PRODUCT_TYPE_x-sell_sum', 'client_credit_AMT_PAYMENT_TOTAL_CURRENT_min_min', 'bureau_AMT_CREDIT_MAX_OVERDUE_sum', 'bureau_CREDIT_TYPE_Unknown type of loan_mean', 'OCCUPATION_TYPE_Secretaries', 'OCCUPATION_TYPE_IT staff', 'previous_CODE_REJECT_REASON_SYSTEM_sum', 'WEEKDAY_APPR_PROCESS_START_SATURDAY', 'previous_NAME_GOODS_CATEGORY_Additional Service_mean', 'client_credit_NAME_CONTRACT_STATUS_Approved_mean_max', 'client_installments_NUM_INSTALMENT_NUMBER_min_min', 'bureau_AMT_CREDIT_MAX_OVERDUE_min', 'client_installments_AMT_INSTALMENT_max_max', 'NAME_INCOME_TYPE_Student', 'bureau_CREDIT_TYPE_Unknown type of loan_sum', 'previous_NAME_GOODS_CATEGORY_Education_mean', 'client_cash_NAME_CONTRACT_STATUS_Approved_sum_sum', 'bureau_AMT_CREDIT_SUM_DEBT_max', 'previous_NAME_TYPE_SUITE_Other_B_sum', 'previous_PRODUCT_COMBINATION_POS others without interest_mean', 'client_cash_NAME_CONTRACT_STATUS_Approved_sum_max', 'client_credit_CNT_DRAWINGS_OTHER_CURRENT_min_sum', 'client_cash_CNT_INSTALMENT_min_max', 'client_cash_NAME_CONTRACT_STATUS_Approved_mean_min', 'previous_NAME_CASH_LOAN_PURPOSE_Everyday expenses_mean', 'AMT_REQ_CREDIT_BUREAU_QRT', 'previous_CHANNEL_TYPE_Country-wide_sum', 'ORGANIZATION_TYPE_Industry: type 11', 'client_cash_NAME_CONTRACT_STATUS_Canceled_mean_sum', 'ORGANIZATION_TYPE_Industry: type 5', 'client_credit_NAME_CONTRACT_STATUS_Refused_mean_max', 'previous_NAME_SELLER_INDUSTRY_Jewelry_mean', 'bureau_CREDIT_TYPE_Real estate loan_mean', 'client_cash_NAME_CONTRACT_STATUS_Approved_sum_min', 'client_credit_AMT_DRAWINGS_OTHER_CURRENT_min_sum', 'previous_NAME_SELLER_INDUSTRY_Jewelry_sum', 'client_installments_DAYS_ENTRY_PAYMENT_sum_max', 'previous_NAME_TYPE_SUITE_Group of people_sum', 'bureau_CREDIT_TYPE_Another type of loan_mean', 'FLAG_EMAIL', 'client_credit_AMT_DRAWINGS_CURRENT_min_sum', 'WALLSMATERIAL_MODE_Mixed', 'bureau_CREDIT_CURRENCY_currency 4_sum', 'NAME_INCOME_TYPE_Businessman', 'previous_NAME_CLIENT_TYPE_XNA_mean', 'previous_NAME_CASH_LOAN_PURPOSE_Journey_mean', 'bureau_CREDIT_TYPE_Loan for working capital replenishment_mean', 'client_credit_AMT_DRAWINGS_OTHER_CURRENT_max_sum', 'previous_NAME_GOODS_CATEGORY_Computers_sum', 'FLAG_DOCUMENT_7', 'client_credit_AMT_DRAWINGS_POS_CURRENT_min_sum', 'ORGANIZATION_TYPE_Emergency', 'previous_NAME_GOODS_CATEGORY_Education_sum', 'NAME_TYPE_SUITE_Spouse, partner', 'WEEKDAY_APPR_PROCESS_START_WEDNESDAY', 'bureau_CREDIT_CURRENCY_currency 4_mean', 'ORGANIZATION_TYPE_Industry: type 8', 'previous_CHANNEL_TYPE_Country-wide_mean', 'FLAG_DOCUMENT_10', 'client_credit_AMT_PAYMENT_TOTAL_CURRENT_min_sum', 'client_cash_NAME_CONTRACT_STATUS_Signed_sum_sum', 'bureau_AMT_ANNUITY_mean', 'client_cash_NAME_CONTRACT_STATUS_Approved_mean_max', 'NAME_TYPE_SUITE_Other_A', 'FLAG_DOCUMENT_19', 'previous_NAME_CASH_LOAN_PURPOSE_Buying a new car_mean', 'client_credit_AMT_CREDIT_LIMIT_ACTUAL_min_min', 'previous_NAME_CASH_LOAN_PURPOSE_Business development_mean', 'ORGANIZATION_TYPE_Religion', 'client_cash_CNT_INSTALMENT_min_mean', 'previous_SELLERPLACE_AREA_min', 'previous_NAME_CASH_LOAN_PURPOSE_Furniture_mean', 'ORGANIZATION_TYPE_Mobile', 'previous_NAME_GOODS_CATEGORY_Direct Sales_mean', 'WEEKDAY_APPR_PROCESS_START_SUNDAY', 'ORGANIZATION_TYPE_Industry: type 2', 'WEEKDAY_APPR_PROCESS_START_FRIDAY', 'previous_NAME_CASH_LOAN_PURPOSE_Refusal to name the goal_mean', 'bureau_CREDIT_TYPE_Another type of loan_sum', 'NAME_FAMILY_STATUS_Separated', 'ORGANIZATION_TYPE_Industry: type 10', 'previous_NAME_GOODS_CATEGORY_Additional Service_sum', 'bureau_CREDIT_TYPE_Loan for purchase of shares (margin lending)_sum', 'ORGANIZATION_TYPE_Postal', 'bureau_AMT_ANNUITY_max', 'client_bureau_balance_STATUS_X_mean_max', 'client_cash_NAME_CONTRACT_STATUS_Canceled_sum_min', 'previous_NAME_TYPE_SUITE_Group of people_mean', 'client_bureau_balance_STATUS_X_mean_min', 'bureau_CREDIT_TYPE_Cash loan (non-earmarked)_sum', 'previous_NAME_CASH_LOAN_PURPOSE_Buying a garage_sum', 'previous_NAME_CASH_LOAN_PURPOSE_Buying a new car_sum', 'ORGANIZATION_TYPE_Trade: type 1', 'HOUSETYPE_MODE_terraced house', 'bureau_CREDIT_TYPE_Cash loan (non-earmarked)_mean', 'AMT_REQ_CREDIT_BUREAU_HOUR', 'client_cash_NAME_CONTRACT_STATUS_Canceled_mean_min', 'previous_NAME_CONTRACT_STATUS_Unused offer_mean', 'previous_NAME_GOODS_CATEGORY_Insurance_sum', 'previous_NAME_GOODS_CATEGORY_Weapon_mean', 'ORGANIZATION_TYPE_Trade: type 5', 'bureau_CREDIT_TYPE_Loan for purchase of shares (margin lending)_mean', 'client_credit_NAME_CONTRACT_STATUS_Demand_mean_min', 'ORGANIZATION_TYPE_Transport: type 2', 'AMT_REQ_CREDIT_BUREAU_WEEK', 'client_cash_NAME_CONTRACT_STATUS_XNA_mean_mean', 'previous_NAME_CASH_LOAN_PURPOSE_Buying a home_mean', 'FLAG_DOCUMENT_12', 'NAME_FAMILY_STATUS_Unknown', 'client_cash_NAME_CONTRACT_STATUS_Canceled_mean_max', 'previous_NAME_GOODS_CATEGORY_Sport and Leisure_mean', 'ORGANIZATION_TYPE_Telecom', 'client_cash_NAME_CONTRACT_STATUS_Approved_mean_mean', 'previous_NAME_CASH_LOAN_PURPOSE_Buying a garage_mean', 'previous_CODE_REJECT_REASON_VERIF_mean', 'previous_CODE_REJECT_REASON_SYSTEM_mean', 'ORGANIZATION_TYPE_Industry: type 6', 'bureau_AMT_CREDIT_SUM_DEBT_mean', 'WALLSMATERIAL_MODE_Others', 'client_cash_NAME_CONTRACT_STATUS_Signed_mean_max', 'client_credit_CNT_DRAWINGS_OTHER_CURRENT_mean_sum', 'bureau_CREDIT_TYPE_Interbank credit_mean', 'bureau_CREDIT_TYPE_Mobile operator loan_mean', 'client_installments_NUM_INSTALMENT_NUMBER_sum_min', 'previous_NAME_GOODS_CATEGORY_Animals_mean', 'FLAG_MOBIL', 'previous_NFLAG_INSURED_ON_APPROVAL_mean', 'previous_NAME_CONTRACT_STATUS_Unused offer_sum', 'client_credit_NAME_CONTRACT_STATUS_Signed_mean_min', 'client_cash_NAME_CONTRACT_STATUS_Completed_sum_mean', 'previous_PRODUCT_COMBINATION_POS other with interest_sum', 'ORGANIZATION_TYPE_Housing', 'NAME_TYPE_SUITE_Group of people', 'WEEKDAY_APPR_PROCESS_START_THURSDAY', 'client_cash_NAME_CONTRACT_STATUS_Completed_mean_mean', 'client_bureau_balance_STATUS_X_mean_mean', 'previous_NAME_TYPE_SUITE_Spouse, partner_sum', 'OCCUPATION_TYPE_Realty agents', 'client_cash_NAME_CONTRACT_STATUS_Approved_sum_mean', 'FLAG_CONT_MOBILE', 'previous_NAME_CASH_LOAN_PURPOSE_XNA_mean', 'client_installments_NUM_INSTALMENT_VERSION_sum_min', 'ORGANIZATION_TYPE_Business Entity Type 1', 'previous_WEEKDAY_APPR_PROCESS_START_TUESDAY_mean', 'FLAG_DOCUMENT_5', 'NAME_HOUSING_TYPE_Co-op apartment', 'previous_RATE_INTEREST_PRIMARY_sum', 'bureau_CREDIT_TYPE_Loan for the purchase of equipment_mean', 'previous_NAME_PAYMENT_TYPE_Non-cash from your account_mean', 'bureau_AMT_CREDIT_SUM_DEBT_min', 'previous_NAME_GOODS_CATEGORY_Weapon_sum', 'ORGANIZATION_TYPE_Legal Services', 'previous_NAME_GOODS_CATEGORY_Office Appliances_mean', 'previous_RATE_INTEREST_PRIVILEGED_sum', 'FLAG_DOCUMENT_20', 'previous_NAME_PAYMENT_TYPE_Cashless from the account of the employer_sum', 'previous_NAME_GOODS_CATEGORY_Office Appliances_sum', 'bureau_CNT_CREDIT_PROLONG_min', 'previous_NAME_CASH_LOAN_PURPOSE_Money for a third person_mean', 'ORGANIZATION_TYPE_Advertising', 'ORGANIZATION_TYPE_Industry: type 7', 'previous_NAME_PAYMENT_TYPE_Non-cash from your account_sum', 'previous_NAME_PAYMENT_TYPE_Cashless from the account of the employer_mean', 'previous_NAME_GOODS_CATEGORY_Direct Sales_sum', 'bureau_AMT_CREDIT_SUM_OVERDUE_min', 'previous_NAME_GOODS_CATEGORY_House Construction_mean', 'previous_NAME_GOODS_CATEGORY_House Construction_sum', 'client_credit_SK_DPD_min_mean', 'client_credit_SK_DPD_min_sum', 'client_cash_NAME_CONTRACT_STATUS_XNA_mean_min')] not found in axis"

In [66]:
len(df.columns)

729

In [65]:
len(random_forest.feature_importances_)

848