# **Libraries**

In [29]:
import pandas as pd
import numpy as np
import os
import sys

import functions
import importlib
importlib.reload(functions)

from feature_engine.selection import DropConstantFeatures
from feature_engine.imputation import ArbitraryNumberImputer

import warnings

# **Display**

In [2]:
%matplotlib inline

pd.options.display.max_rows = 300000
pd.options.display.max_columns = 999
pd.options.display.max_colwidth = 500

warnings.filterwarnings("ignore")
warnings.simplefilter(action="ignore", category=FutureWarning)

pd.set_option('display.max_rows', 200)

size = 20

# **Variables**

In [3]:
random_state = 101
target = 'TARGET'

# **Data**

## **Load Data**

In [13]:
app_train = pd.read_csv(
    r"C:\Users\Dell\Documents\AI\Risk\Data\application_train.csv",
    index_col=False
)

In [14]:
app_train.shape

(307511, 122)

## **Reduce Memory Usage**

In [9]:
app_train = functions.reduce_memory_usage(app_train)

Memory usage of dataframe is 286.23 MB
Memory usage after optimization is: 92.38 MB
Decreased by 67.7%


## **Impute Missing Data**

In [16]:
num_value = -99999

for col in app_train.select_dtypes(include=['float16', 'float32', 'float64']).columns:
    app_train[col].fillna(num_value, inplace=True)

In [17]:
cat_value = 'UNKNOWN'

for col in app_train.select_dtypes(include=['object']).columns:
    app_train[col].fillna(cat_value, inplace=True)

## **Drop Constant Features**

In [24]:
from feature_engine.selection import DropConstantFeatures

dcf = DropConstantFeatures(tol = 0.75)
dcf.fit_transform(app_train)

Unnamed: 0,SK_ID_CURR,CODE_GENDER,FLAG_OWN_CAR,FLAG_OWN_REALTY,CNT_CHILDREN,AMT_INCOME_TOTAL,AMT_CREDIT,AMT_ANNUITY,AMT_GOODS_PRICE,NAME_INCOME_TYPE,NAME_EDUCATION_TYPE,NAME_FAMILY_STATUS,REGION_POPULATION_RELATIVE,DAYS_BIRTH,DAYS_EMPLOYED,DAYS_REGISTRATION,DAYS_ID_PUBLISH,OWN_CAR_AGE,FLAG_PHONE,OCCUPATION_TYPE,CNT_FAM_MEMBERS,REGION_RATING_CLIENT,REGION_RATING_CLIENT_W_CITY,WEEKDAY_APPR_PROCESS_START,HOUR_APPR_PROCESS_START,ORGANIZATION_TYPE,EXT_SOURCE_1,EXT_SOURCE_2,EXT_SOURCE_3,APARTMENTS_AVG,BASEMENTAREA_AVG,YEARS_BEGINEXPLUATATION_AVG,YEARS_BUILD_AVG,COMMONAREA_AVG,ELEVATORS_AVG,ENTRANCES_AVG,FLOORSMAX_AVG,FLOORSMIN_AVG,LANDAREA_AVG,LIVINGAPARTMENTS_AVG,LIVINGAREA_AVG,NONLIVINGAPARTMENTS_AVG,NONLIVINGAREA_AVG,APARTMENTS_MODE,BASEMENTAREA_MODE,YEARS_BEGINEXPLUATATION_MODE,YEARS_BUILD_MODE,COMMONAREA_MODE,ELEVATORS_MODE,ENTRANCES_MODE,FLOORSMAX_MODE,FLOORSMIN_MODE,LANDAREA_MODE,LIVINGAPARTMENTS_MODE,LIVINGAREA_MODE,NONLIVINGAPARTMENTS_MODE,NONLIVINGAREA_MODE,APARTMENTS_MEDI,BASEMENTAREA_MEDI,YEARS_BEGINEXPLUATATION_MEDI,YEARS_BUILD_MEDI,COMMONAREA_MEDI,ELEVATORS_MEDI,ENTRANCES_MEDI,FLOORSMAX_MEDI,FLOORSMIN_MEDI,LANDAREA_MEDI,LIVINGAPARTMENTS_MEDI,LIVINGAREA_MEDI,NONLIVINGAPARTMENTS_MEDI,NONLIVINGAREA_MEDI,FONDKAPREMONT_MODE,HOUSETYPE_MODE,TOTALAREA_MODE,WALLSMATERIAL_MODE,EMERGENCYSTATE_MODE,OBS_30_CNT_SOCIAL_CIRCLE,OBS_60_CNT_SOCIAL_CIRCLE,DAYS_LAST_PHONE_CHANGE,FLAG_DOCUMENT_3,AMT_REQ_CREDIT_BUREAU_MON,AMT_REQ_CREDIT_BUREAU_QRT,AMT_REQ_CREDIT_BUREAU_YEAR
0,100002,M,N,Y,0,202500.0,406597.5,24700.5,351000.0,Working,Secondary / secondary special,Single / not married,0.018801,-9461,-637,-3648.0,-2120,-99999.0,1,Laborers,1.0,2,2,WEDNESDAY,10,Business Entity Type 3,0.083037,0.262949,0.139376,0.0247,0.0369,0.9722,0.6192,0.0143,0.00,0.0690,0.0833,0.1250,0.0369,0.0202,0.0190,0.0000,0.0000,0.0252,0.0383,0.9722,0.6341,0.0144,0.0000,0.0690,0.0833,0.1250,0.0377,0.0220,0.0198,0.0,0.0000,0.0250,0.0369,0.9722,0.6243,0.0144,0.00,0.0690,0.0833,0.1250,0.0375,0.0205,0.0193,0.0000,0.0000,reg oper account,block of flats,0.0149,"Stone, brick",No,2.0,2.0,-1134.0,1,0.0,0.0,1.0
1,100003,F,N,N,0,270000.0,1293502.5,35698.5,1129500.0,State servant,Higher education,Married,0.003541,-16765,-1188,-1186.0,-291,-99999.0,1,Core staff,2.0,1,1,MONDAY,11,School,0.311267,0.622246,-99999.000000,0.0959,0.0529,0.9851,0.7960,0.0605,0.08,0.0345,0.2917,0.3333,0.0130,0.0773,0.0549,0.0039,0.0098,0.0924,0.0538,0.9851,0.8040,0.0497,0.0806,0.0345,0.2917,0.3333,0.0128,0.0790,0.0554,0.0,0.0000,0.0968,0.0529,0.9851,0.7987,0.0608,0.08,0.0345,0.2917,0.3333,0.0132,0.0787,0.0558,0.0039,0.0100,reg oper account,block of flats,0.0714,Block,No,1.0,1.0,-828.0,1,0.0,0.0,0.0
2,100004,M,Y,Y,0,67500.0,135000.0,6750.0,135000.0,Working,Secondary / secondary special,Single / not married,0.010032,-19046,-225,-4260.0,-2531,26.0,1,Laborers,1.0,2,2,MONDAY,9,Government,-99999.000000,0.555912,0.729567,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.00,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.00,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,UNKNOWN,UNKNOWN,-99999.0000,UNKNOWN,UNKNOWN,0.0,0.0,-815.0,0,0.0,0.0,0.0
3,100006,F,N,Y,0,135000.0,312682.5,29686.5,297000.0,Working,Secondary / secondary special,Civil marriage,0.008019,-19005,-3039,-9833.0,-2437,-99999.0,0,Laborers,2.0,2,2,WEDNESDAY,17,Business Entity Type 3,-99999.000000,0.650442,-99999.000000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.00,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.00,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,UNKNOWN,UNKNOWN,-99999.0000,UNKNOWN,UNKNOWN,2.0,2.0,-617.0,1,-99999.0,-99999.0,-99999.0
4,100007,M,N,Y,0,121500.0,513000.0,21865.5,513000.0,Working,Secondary / secondary special,Single / not married,0.028663,-19932,-3038,-4311.0,-3458,-99999.0,0,Core staff,1.0,2,2,THURSDAY,11,Religion,-99999.000000,0.322738,-99999.000000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.00,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.00,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,UNKNOWN,UNKNOWN,-99999.0000,UNKNOWN,UNKNOWN,0.0,0.0,-1106.0,0,0.0,0.0,0.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
307506,456251,M,N,N,0,157500.0,254700.0,27558.0,225000.0,Working,Secondary / secondary special,Separated,0.032561,-9327,-236,-8456.0,-1982,-99999.0,0,Sales staff,1.0,1,1,THURSDAY,15,Services,0.145570,0.681632,-99999.000000,0.2021,0.0887,0.9876,0.8300,0.0202,0.22,0.1034,0.6042,0.2708,0.0594,0.1484,0.1965,0.0753,0.1095,0.1008,0.0172,0.9782,0.7125,0.0172,0.0806,0.0345,0.4583,0.0417,0.0094,0.0882,0.0853,0.0,0.0125,0.2040,0.0887,0.9876,0.8323,0.0203,0.22,0.1034,0.6042,0.2708,0.0605,0.1509,0.2001,0.0757,0.1118,reg oper account,block of flats,0.2898,"Stone, brick",No,0.0,0.0,-273.0,0,-99999.0,-99999.0,-99999.0
307507,456252,F,N,Y,0,72000.0,269550.0,12001.5,225000.0,Pensioner,Secondary / secondary special,Widow,0.025164,-20775,365243,-4388.0,-4090,-99999.0,1,UNKNOWN,1.0,2,2,MONDAY,8,XNA,-99999.000000,0.115992,-99999.000000,0.0247,0.0435,0.9727,0.6260,0.0022,0.00,0.1034,0.0833,0.1250,0.0579,0.0202,0.0257,0.0000,0.0000,0.0252,0.0451,0.9727,0.6406,0.0022,0.0000,0.1034,0.0833,0.1250,0.0592,0.0220,0.0267,0.0,0.0000,0.0250,0.0435,0.9727,0.6310,0.0022,0.00,0.1034,0.0833,0.1250,0.0589,0.0205,0.0261,0.0000,0.0000,reg oper account,block of flats,0.0214,"Stone, brick",No,0.0,0.0,0.0,1,-99999.0,-99999.0,-99999.0
307508,456253,F,N,Y,0,153000.0,677664.0,29979.0,585000.0,Working,Higher education,Separated,0.005002,-14966,-7921,-6737.0,-5150,-99999.0,0,Managers,1.0,3,3,THURSDAY,9,School,0.744026,0.535722,0.218859,0.1031,0.0862,0.9816,0.7484,0.0123,0.00,0.2069,0.1667,0.2083,-99999.0000,0.0841,0.9279,0.0000,0.0000,0.1050,0.0894,0.9816,0.7583,0.0124,0.0000,0.2069,0.1667,0.2083,-99999.0000,0.0918,0.9667,0.0,0.0000,0.1041,0.0862,0.9816,0.7518,0.0124,0.00,0.2069,0.1667,0.2083,-99999.0000,0.0855,0.9445,0.0000,0.0000,reg oper account,block of flats,0.7970,Panel,No,6.0,6.0,-1909.0,1,1.0,0.0,1.0
307509,456254,F,N,Y,0,171000.0,370107.0,20205.0,319500.0,Commercial associate,Secondary / secondary special,Married,0.005313,-11961,-4786,-2562.0,-931,-99999.0,0,Laborers,2.0,2,2,WEDNESDAY,9,Business Entity Type 1,-99999.000000,0.514163,0.661024,0.0124,-99999.0000,0.9771,-99999.0000,-99999.0000,-99999.00,0.0690,0.0417,-99999.0000,-99999.0000,-99999.0000,0.0061,-99999.0000,-99999.0000,0.0126,-99999.0000,0.9772,-99999.0000,-99999.0000,-99999.0000,0.0690,0.0417,-99999.0000,-99999.0000,-99999.0000,0.0063,-99999.0,-99999.0000,0.0125,-99999.0000,0.9771,-99999.0000,-99999.0000,-99999.00,0.0690,0.0417,-99999.0000,-99999.0000,-99999.0000,0.0062,-99999.0000,-99999.0000,UNKNOWN,block of flats,0.0086,"Stone, brick",No,0.0,0.0,-322.0,1,0.0,0.0,0.0


## **Impute Missing Data**

In [30]:
ani = ArbitraryNumberImputer(arbitrary_number=-99999)
ani.fit(app_train)
ani.transform(app_train)

Unnamed: 0,SK_ID_CURR,TARGET,NAME_CONTRACT_TYPE,CODE_GENDER,FLAG_OWN_CAR,FLAG_OWN_REALTY,CNT_CHILDREN,AMT_INCOME_TOTAL,AMT_CREDIT,AMT_ANNUITY,AMT_GOODS_PRICE,NAME_TYPE_SUITE,NAME_INCOME_TYPE,NAME_EDUCATION_TYPE,NAME_FAMILY_STATUS,NAME_HOUSING_TYPE,REGION_POPULATION_RELATIVE,DAYS_BIRTH,DAYS_EMPLOYED,DAYS_REGISTRATION,DAYS_ID_PUBLISH,OWN_CAR_AGE,FLAG_MOBIL,FLAG_EMP_PHONE,FLAG_WORK_PHONE,FLAG_CONT_MOBILE,FLAG_PHONE,FLAG_EMAIL,OCCUPATION_TYPE,CNT_FAM_MEMBERS,REGION_RATING_CLIENT,REGION_RATING_CLIENT_W_CITY,WEEKDAY_APPR_PROCESS_START,HOUR_APPR_PROCESS_START,REG_REGION_NOT_LIVE_REGION,REG_REGION_NOT_WORK_REGION,LIVE_REGION_NOT_WORK_REGION,REG_CITY_NOT_LIVE_CITY,REG_CITY_NOT_WORK_CITY,LIVE_CITY_NOT_WORK_CITY,ORGANIZATION_TYPE,EXT_SOURCE_1,EXT_SOURCE_2,EXT_SOURCE_3,APARTMENTS_AVG,BASEMENTAREA_AVG,YEARS_BEGINEXPLUATATION_AVG,YEARS_BUILD_AVG,COMMONAREA_AVG,ELEVATORS_AVG,ENTRANCES_AVG,FLOORSMAX_AVG,FLOORSMIN_AVG,LANDAREA_AVG,LIVINGAPARTMENTS_AVG,LIVINGAREA_AVG,NONLIVINGAPARTMENTS_AVG,NONLIVINGAREA_AVG,APARTMENTS_MODE,BASEMENTAREA_MODE,YEARS_BEGINEXPLUATATION_MODE,YEARS_BUILD_MODE,COMMONAREA_MODE,ELEVATORS_MODE,ENTRANCES_MODE,FLOORSMAX_MODE,FLOORSMIN_MODE,LANDAREA_MODE,LIVINGAPARTMENTS_MODE,LIVINGAREA_MODE,NONLIVINGAPARTMENTS_MODE,NONLIVINGAREA_MODE,APARTMENTS_MEDI,BASEMENTAREA_MEDI,YEARS_BEGINEXPLUATATION_MEDI,YEARS_BUILD_MEDI,COMMONAREA_MEDI,ELEVATORS_MEDI,ENTRANCES_MEDI,FLOORSMAX_MEDI,FLOORSMIN_MEDI,LANDAREA_MEDI,LIVINGAPARTMENTS_MEDI,LIVINGAREA_MEDI,NONLIVINGAPARTMENTS_MEDI,NONLIVINGAREA_MEDI,FONDKAPREMONT_MODE,HOUSETYPE_MODE,TOTALAREA_MODE,WALLSMATERIAL_MODE,EMERGENCYSTATE_MODE,OBS_30_CNT_SOCIAL_CIRCLE,DEF_30_CNT_SOCIAL_CIRCLE,OBS_60_CNT_SOCIAL_CIRCLE,DEF_60_CNT_SOCIAL_CIRCLE,DAYS_LAST_PHONE_CHANGE,FLAG_DOCUMENT_2,FLAG_DOCUMENT_3,FLAG_DOCUMENT_4,FLAG_DOCUMENT_5,FLAG_DOCUMENT_6,FLAG_DOCUMENT_7,FLAG_DOCUMENT_8,FLAG_DOCUMENT_9,FLAG_DOCUMENT_10,FLAG_DOCUMENT_11,FLAG_DOCUMENT_12,FLAG_DOCUMENT_13,FLAG_DOCUMENT_14,FLAG_DOCUMENT_15,FLAG_DOCUMENT_16,FLAG_DOCUMENT_17,FLAG_DOCUMENT_18,FLAG_DOCUMENT_19,FLAG_DOCUMENT_20,FLAG_DOCUMENT_21,AMT_REQ_CREDIT_BUREAU_HOUR,AMT_REQ_CREDIT_BUREAU_DAY,AMT_REQ_CREDIT_BUREAU_WEEK,AMT_REQ_CREDIT_BUREAU_MON,AMT_REQ_CREDIT_BUREAU_QRT,AMT_REQ_CREDIT_BUREAU_YEAR
0,100002,1,Cash loans,M,N,Y,0,202500.0,406597.5,24700.5,351000.0,Unaccompanied,Working,Secondary / secondary special,Single / not married,House / apartment,0.018801,-9461,-637,-3648.0,-2120,-99999.0,1,1,0,1,1,0,Laborers,1.0,2,2,WEDNESDAY,10,0,0,0,0,0,0,Business Entity Type 3,0.083037,0.262949,0.139376,0.0247,0.0369,0.9722,0.6192,0.0143,0.00,0.0690,0.0833,0.1250,0.0369,0.0202,0.0190,0.0000,0.0000,0.0252,0.0383,0.9722,0.6341,0.0144,0.0000,0.0690,0.0833,0.1250,0.0377,0.0220,0.0198,0.0,0.0000,0.0250,0.0369,0.9722,0.6243,0.0144,0.00,0.0690,0.0833,0.1250,0.0375,0.0205,0.0193,0.0000,0.0000,reg oper account,block of flats,0.0149,"Stone, brick",No,2.0,2.0,2.0,2.0,-1134.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,1.0
1,100003,0,Cash loans,F,N,N,0,270000.0,1293502.5,35698.5,1129500.0,Family,State servant,Higher education,Married,House / apartment,0.003541,-16765,-1188,-1186.0,-291,-99999.0,1,1,0,1,1,0,Core staff,2.0,1,1,MONDAY,11,0,0,0,0,0,0,School,0.311267,0.622246,-99999.000000,0.0959,0.0529,0.9851,0.7960,0.0605,0.08,0.0345,0.2917,0.3333,0.0130,0.0773,0.0549,0.0039,0.0098,0.0924,0.0538,0.9851,0.8040,0.0497,0.0806,0.0345,0.2917,0.3333,0.0128,0.0790,0.0554,0.0,0.0000,0.0968,0.0529,0.9851,0.7987,0.0608,0.08,0.0345,0.2917,0.3333,0.0132,0.0787,0.0558,0.0039,0.0100,reg oper account,block of flats,0.0714,Block,No,1.0,0.0,1.0,0.0,-828.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0
2,100004,0,Revolving loans,M,Y,Y,0,67500.0,135000.0,6750.0,135000.0,Unaccompanied,Working,Secondary / secondary special,Single / not married,House / apartment,0.010032,-19046,-225,-4260.0,-2531,26.0,1,1,1,1,1,0,Laborers,1.0,2,2,MONDAY,9,0,0,0,0,0,0,Government,-99999.000000,0.555912,0.729567,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.00,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.00,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,UNKNOWN,UNKNOWN,-99999.0000,UNKNOWN,UNKNOWN,0.0,0.0,0.0,0.0,-815.0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0
3,100006,0,Cash loans,F,N,Y,0,135000.0,312682.5,29686.5,297000.0,Unaccompanied,Working,Secondary / secondary special,Civil marriage,House / apartment,0.008019,-19005,-3039,-9833.0,-2437,-99999.0,1,1,0,1,0,0,Laborers,2.0,2,2,WEDNESDAY,17,0,0,0,0,0,0,Business Entity Type 3,-99999.000000,0.650442,-99999.000000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.00,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.00,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,UNKNOWN,UNKNOWN,-99999.0000,UNKNOWN,UNKNOWN,2.0,0.0,2.0,0.0,-617.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,-99999.0,-99999.0,-99999.0,-99999.0,-99999.0,-99999.0
4,100007,0,Cash loans,M,N,Y,0,121500.0,513000.0,21865.5,513000.0,Unaccompanied,Working,Secondary / secondary special,Single / not married,House / apartment,0.028663,-19932,-3038,-4311.0,-3458,-99999.0,1,1,0,1,0,0,Core staff,1.0,2,2,THURSDAY,11,0,0,0,0,1,1,Religion,-99999.000000,0.322738,-99999.000000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.00,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.00,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,-99999.0000,UNKNOWN,UNKNOWN,-99999.0000,UNKNOWN,UNKNOWN,0.0,0.0,0.0,0.0,-1106.0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
307506,456251,0,Cash loans,M,N,N,0,157500.0,254700.0,27558.0,225000.0,Unaccompanied,Working,Secondary / secondary special,Separated,With parents,0.032561,-9327,-236,-8456.0,-1982,-99999.0,1,1,0,1,0,0,Sales staff,1.0,1,1,THURSDAY,15,0,0,0,0,0,0,Services,0.145570,0.681632,-99999.000000,0.2021,0.0887,0.9876,0.8300,0.0202,0.22,0.1034,0.6042,0.2708,0.0594,0.1484,0.1965,0.0753,0.1095,0.1008,0.0172,0.9782,0.7125,0.0172,0.0806,0.0345,0.4583,0.0417,0.0094,0.0882,0.0853,0.0,0.0125,0.2040,0.0887,0.9876,0.8323,0.0203,0.22,0.1034,0.6042,0.2708,0.0605,0.1509,0.2001,0.0757,0.1118,reg oper account,block of flats,0.2898,"Stone, brick",No,0.0,0.0,0.0,0.0,-273.0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,-99999.0,-99999.0,-99999.0,-99999.0,-99999.0,-99999.0
307507,456252,0,Cash loans,F,N,Y,0,72000.0,269550.0,12001.5,225000.0,Unaccompanied,Pensioner,Secondary / secondary special,Widow,House / apartment,0.025164,-20775,365243,-4388.0,-4090,-99999.0,1,0,0,1,1,0,UNKNOWN,1.0,2,2,MONDAY,8,0,0,0,0,0,0,XNA,-99999.000000,0.115992,-99999.000000,0.0247,0.0435,0.9727,0.6260,0.0022,0.00,0.1034,0.0833,0.1250,0.0579,0.0202,0.0257,0.0000,0.0000,0.0252,0.0451,0.9727,0.6406,0.0022,0.0000,0.1034,0.0833,0.1250,0.0592,0.0220,0.0267,0.0,0.0000,0.0250,0.0435,0.9727,0.6310,0.0022,0.00,0.1034,0.0833,0.1250,0.0589,0.0205,0.0261,0.0000,0.0000,reg oper account,block of flats,0.0214,"Stone, brick",No,0.0,0.0,0.0,0.0,0.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,-99999.0,-99999.0,-99999.0,-99999.0,-99999.0,-99999.0
307508,456253,0,Cash loans,F,N,Y,0,153000.0,677664.0,29979.0,585000.0,Unaccompanied,Working,Higher education,Separated,House / apartment,0.005002,-14966,-7921,-6737.0,-5150,-99999.0,1,1,0,1,0,1,Managers,1.0,3,3,THURSDAY,9,0,0,0,0,1,1,School,0.744026,0.535722,0.218859,0.1031,0.0862,0.9816,0.7484,0.0123,0.00,0.2069,0.1667,0.2083,-99999.0000,0.0841,0.9279,0.0000,0.0000,0.1050,0.0894,0.9816,0.7583,0.0124,0.0000,0.2069,0.1667,0.2083,-99999.0000,0.0918,0.9667,0.0,0.0000,0.1041,0.0862,0.9816,0.7518,0.0124,0.00,0.2069,0.1667,0.2083,-99999.0000,0.0855,0.9445,0.0000,0.0000,reg oper account,block of flats,0.7970,Panel,No,6.0,0.0,6.0,0.0,-1909.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1.0,0.0,0.0,1.0,0.0,1.0
307509,456254,1,Cash loans,F,N,Y,0,171000.0,370107.0,20205.0,319500.0,Unaccompanied,Commercial associate,Secondary / secondary special,Married,House / apartment,0.005313,-11961,-4786,-2562.0,-931,-99999.0,1,1,0,1,0,0,Laborers,2.0,2,2,WEDNESDAY,9,0,0,0,1,1,0,Business Entity Type 1,-99999.000000,0.514163,0.661024,0.0124,-99999.0000,0.9771,-99999.0000,-99999.0000,-99999.00,0.0690,0.0417,-99999.0000,-99999.0000,-99999.0000,0.0061,-99999.0000,-99999.0000,0.0126,-99999.0000,0.9772,-99999.0000,-99999.0000,-99999.0000,0.0690,0.0417,-99999.0000,-99999.0000,-99999.0000,0.0063,-99999.0,-99999.0000,0.0125,-99999.0000,0.9771,-99999.0000,-99999.0000,-99999.00,0.0690,0.0417,-99999.0000,-99999.0000,-99999.0000,0.0062,-99999.0000,-99999.0000,UNKNOWN,block of flats,0.0086,"Stone, brick",No,0.0,0.0,0.0,0.0,-322.0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0


In [31]:
cat_value = 'UNKNOWN'

for col in app_train.select_dtypes(include=['object']).columns:
    app_train[col].fillna(cat_value, inplace=True)