In [2]:
import regex as re
import gc
import time
import numpy as np
import pandas as pd
import pickle
import seaborn as sns
import matplotlib
%matplotlib inline
import matplotlib.pyplot as plt
from sklearn.model_selection import train_test_split
from sklearn.metrics import roc_auc_score
from sklearn.preprocessing import LabelEncoder
from sklearn.impute import SimpleImputer, KNNImputer
import warnings
warnings.filterwarnings("ignore")
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)

# Ordinal Encoding

In [2]:
def apply_ordinal_encoding(train_data, test_data, categorical_features):
    '''
    Apply ordinal encoding to categorical features in train and test data
    '''
    # Initialize the encoder
    encoder = OrdinalEncoder(handle_unknown='use_encoded_value', unknown_value=-1)
    
    # Fit the encoder on the train data
    encoder.fit(train_data[categorical_features])
    
    # Transform the train and test data using the encoder
    train_data_encoded = train_data.copy()
    train_data_encoded[categorical_features] = encoder.transform(train_data[categorical_features])
    
    test_data_encoded = test_data.copy()
    test_data_encoded[categorical_features] = encoder.transform(test_data[categorical_features])
    
    return train_data_encoded, test_data_encoded

In [3]:
def cat_num_features(df):
    
    '''
        Utility Function to get the names of Categorical Features and 
        Numerical Features of the given Dataset.
    '''
    
    catf = []
    numf = []
    
    catf = [
            'ProductCD', 'card1', 'card2', 'card3', 'card4', 'card5', 
            'card6', 'addr1', 'addr2', 'P_emaildomain', 'R_emaildomain', 'M1', 'M2', 
            'M3', 'M4', 'M5', 'M6', 'M7', 'M8', 'M9', 'DeviceType', 'DeviceInfo',
            'TransactionDW', 'card1_div_1000', 'card2_div_10', 'P_parent_domain', 
            'P_domain_name', 'P_top_level_domain', 'R_parent_domain', 'R_domain_name', 
            'R_top_level_domain', 'device_name', 'device_version', 'os_name', 'os_version', 
            # 'screen_width', 'screen_height', 'card_intr1', 'card_intr2', 'card1_addr1', 
            # 'card1_addr2', 'card2_addr1', 'card2_addr2', 'card3_addr1', 'card3_addr2', 
            # 'card5_addr1', 'card5_addr2', 'card6_addr1', 'card6_addr2', 'ProductCD_addr1', 
            # 'ProductCD_addr2', 'card1_ProductCD', 'card2_ProductCD', 'card5_ProductCD', 
            # 'card6_ProductCD', 'addr1_P_emaildomain', 'card1_P_emaildoman', 'card1_addr1_P_emaildomain',
            # 'uid1', 'uid2'
            ]

    catf+=['id_'+str(i) for i in range(12,39)]


    # Updating the Categorical Feature Names List based on the columns present in the dataframe
    catf = [feature for feature in catf if feature in df.columns]
    numf = [feature for feature in df.columns if feature not in catf and not feature == 'isFraud']
    
    return (catf, numf)  

In [9]:
def label_encode(X_train, X_test, catf):
  
  '''
    Utility Function to Encode Categorical Features.
  '''

  for f in catf:
    
    X_train[f] = X_train[f].astype(str)
    X_test[f] = X_test[f].astype(str)
    
    le = LabelEncoder()
    le.fit(X_train[f])
    mapping = dict(zip(le.classes_, le.transform(le.classes_)))
    X_train[f] = le.transform(X_train[f])
    
    # Manually Encoding the test and Test Dataset so as to avoid error for any category which is not present in train set
    
    # All the categories which are not present in train datset are encoded as -1    
    X_test[f] = [-1 if mapping.get(v, -1)==-1 else mapping[v] for v in X_test[f].values ]

  return (X_train, X_test)

In [4]:
%%time
train_data = pd.read_pickle('basic_fe_train.pkl')
test_data = pd.read_pickle('basic_fe_test.pkl')

CPU times: user 1.25 s, sys: 1.1 s, total: 2.35 s
Wall time: 2.59 s


In [69]:
test_data.head()

Unnamed: 0_level_0,TransactionDT,TransactionAmt,ProductCD,card1,card2,card3,card4,card5,card6,addr1,addr2,dist1,P_emaildomain,R_emaildomain,C1,C2,C4,C5,C6,C7,C9,C11,C12,C13,C14,D1,D2,D3,D4,D5,D6,D8,D9,D10,D11,D12,D13,D14,D15,M1,M2,M3,M4,M5,M6,M7,M8,M9,V1,V3,V4,V6,V8,V11,V13,V18,V20,V30,V36,V37,V40,V44,V47,V48,V52,V54,V60,V70,V76,V78,V80,V81,V82,V87,V91,V99,V127,V130,V131,V139,V147,V156,V165,V166,V169,V171,V173,V174,V175,V176,V180,V183,V185,V195,V198,V203,V205,V207,V209,V210,V215,V216,V220,V221,V223,V230,V234,V235,V238,V240,V241,V250,V252,V257,V258,V260,V262,V263,V264,V265,V268,V271,V274,V277,V282,V283,V289,V291,V303,V307,V310,V312,V315,id_01,id_02,id_03,id_04,id_05,id_06,id_09,id_10,id_11,id_12,id_13,id_15,id_16,id_17,id_19,id_20,id_28,id_29,id_30,id_33,id_35,id_36,id_37,DeviceType,DeviceInfo,TransactionHR,TransactionMT,TransactionDW,dollars,cents,P_parent_domain,P_domain_name,P_top_level_domain,card1_div_1000,card2_div_10,R_parent_domain,R_domain_name,R_top_level_domain,device_name,device_version,os_name,os_version
TransactionID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 100_level_1,Unnamed: 101_level_1,Unnamed: 102_level_1,Unnamed: 103_level_1,Unnamed: 104_level_1,Unnamed: 105_level_1,Unnamed: 106_level_1,Unnamed: 107_level_1,Unnamed: 108_level_1,Unnamed: 109_level_1,Unnamed: 110_level_1,Unnamed: 111_level_1,Unnamed: 112_level_1,Unnamed: 113_level_1,Unnamed: 114_level_1,Unnamed: 115_level_1,Unnamed: 116_level_1,Unnamed: 117_level_1,Unnamed: 118_level_1,Unnamed: 119_level_1,Unnamed: 120_level_1,Unnamed: 121_level_1,Unnamed: 122_level_1,Unnamed: 123_level_1,Unnamed: 124_level_1,Unnamed: 125_level_1,Unnamed: 126_level_1,Unnamed: 127_level_1,Unnamed: 128_level_1,Unnamed: 129_level_1,Unnamed: 130_level_1,Unnamed: 131_level_1,Unnamed: 132_level_1,Unnamed: 133_level_1,Unnamed: 134_level_1,Unnamed: 135_level_1,Unnamed: 136_level_1,Unnamed: 137_level_1,Unnamed: 138_level_1,Unnamed: 139_level_1,Unnamed: 140_level_1,Unnamed: 141_level_1,Unnamed: 142_level_1,Unnamed: 143_level_1,Unnamed: 144_level_1,Unnamed: 145_level_1,Unnamed: 146_level_1,Unnamed: 147_level_1,Unnamed: 148_level_1,Unnamed: 149_level_1,Unnamed: 150_level_1,Unnamed: 151_level_1,Unnamed: 152_level_1,Unnamed: 153_level_1,Unnamed: 154_level_1,Unnamed: 155_level_1,Unnamed: 156_level_1,Unnamed: 157_level_1,Unnamed: 158_level_1,Unnamed: 159_level_1,Unnamed: 160_level_1,Unnamed: 161_level_1,Unnamed: 162_level_1,Unnamed: 163_level_1,Unnamed: 164_level_1,Unnamed: 165_level_1,Unnamed: 166_level_1,Unnamed: 167_level_1,Unnamed: 168_level_1,Unnamed: 169_level_1,Unnamed: 170_level_1,Unnamed: 171_level_1,Unnamed: 172_level_1,Unnamed: 173_level_1,Unnamed: 174_level_1,Unnamed: 175_level_1
3663549,18403224,31.95,-1,458,-1,-1,-1,-1,-1,-1,-1,1.0,-1,-1,6.0,6.0,0.0,3.0,4.0,0.0,6.0,5.0,1.0,115.0,6.0,419.0,419.0,27.0,398.0,27.0,,,,418.0,203.0,,,,409.0,-1,-1,-1,-1,-1,-1,-1,-1,-1,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,1.0,1.0,47.950001,47.950001,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,1.0,0.0,47.950001,47.950001,0.0,0.0,,,,,,,,,,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,0,0,0,31,95,-1,-1,-1,2,-1,-1,-1,-1,-1,-1,-1,-1
3663550,18403263,49.0,-1,7191,-1,-1,-1,-1,-1,-1,-1,4.0,-1,-1,3.0,2.0,0.0,0.0,1.0,0.0,2.0,1.0,1.0,12.0,2.0,149.0,149.0,7.0,634.0,7.0,,,,231.0,634.0,,,,634.0,-1,-1,-1,-1,-1,-1,-1,-1,-1,1.0,1.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,1.0,1.0,0.0,4.0,280.0,280.0,77.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,1.0,0.0,280.0,280.0,77.0,0.0,,,,,,,,,,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,0,1,0,49,0,-1,-1,-1,12,-1,-1,-1,-1,-1,-1,-1,-1
3663551,18403310,171.0,-1,7417,-1,-1,-1,-1,-1,-1,-1,2635.0,-1,-1,2.0,2.0,0.0,0.0,5.0,0.0,4.0,2.0,0.0,22.0,2.0,137.0,137.0,10.0,97.0,10.0,,,,136.0,136.0,,,,97.0,-1,-1,-1,-1,-1,-1,-1,-1,-1,1.0,1.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,2.0,2.0,0.0,0.0,1.0,1.0,0.0,3.0,968.0,705.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,2.0,0.0,1321.0,1058.0,0.0,0.0,,,,,,,,,,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,0,1,0,171,0,-1,-1,-1,12,-1,-1,-1,-1,-1,-1,-1,-1
3663552,18403310,284.95,-1,1101,-1,-1,-1,-1,-1,-1,-1,17.0,-1,-1,5.0,2.0,0.0,1.0,1.0,0.0,2.0,2.0,0.0,7.0,4.0,42.0,42.0,41.0,242.0,41.0,,,,242.0,242.0,,,,242.0,-1,-1,-1,-1,-1,-1,-1,-1,-1,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,1.0,1.0,2.0,2.0,0.0,2.0,2.0,1.0,0.0,1.0,0.0,1.0,1.0,1.0,0.0,0.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,282.540009,,,,,,,,,,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,0,1,0,284,95,-1,-1,-1,2,-1,-1,-1,-1,-1,-1,-1,-1
3663553,18403317,67.95,-1,-1,-1,-1,-1,-1,-1,-1,-1,6.0,-1,-1,6.0,6.0,0.0,2.0,5.0,0.0,5.0,6.0,0.0,14.0,6.0,22.0,22.0,0.0,22.0,0.0,,,,22.0,22.0,,,,22.0,-1,-1,-1,-1,-1,-1,-1,-1,-1,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,1.0,1.0,1.0,1.0,0.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,1.0,1.0,0.0,0.0,1.0,1.0,1.0,3.0,183.850006,183.850006,67.949997,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1.0,1.0,1.0,1.0,0.0,183.850006,183.850006,67.949997,67.949997,,,,,,,,,,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,0,1,0,67,95,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1


In [5]:
pd.__version__ 

'1.5.2'

In [6]:
train_data.head()

Unnamed: 0_level_0,isFraud,TransactionDT,TransactionAmt,ProductCD,card1,card2,card3,card4,card5,card6,addr1,addr2,dist1,P_emaildomain,R_emaildomain,C1,C2,C4,C5,C6,C7,C9,C11,C12,C13,C14,D1,D2,D3,D4,D5,D6,D8,D9,D10,D11,D12,D13,D14,D15,M1,M2,M3,M4,M5,M6,M7,M8,M9,V1,V3,V4,V6,V8,V11,V13,V18,V20,V30,V36,V37,V40,V44,V47,V48,V52,V54,V60,V70,V76,V78,V80,V81,V82,V87,V91,V99,V127,V130,V131,V139,V147,V156,V165,V166,V169,V171,V173,V174,V175,V176,V180,V183,V185,V195,V198,V203,V205,V207,V209,V210,V215,V216,V220,V221,V223,V230,V234,V235,V238,V240,V241,V250,V252,V257,V258,V260,V262,V263,V264,V265,V268,V271,V274,V277,V282,V283,V289,V291,V303,V307,V310,V312,V315,id_01,id_02,id_03,id_04,id_05,id_06,id_09,id_10,id_11,id_12,id_13,id_15,id_16,id_17,id_19,id_20,id_28,id_29,id_30,id_33,id_35,id_36,id_37,DeviceType,DeviceInfo,TransactionHR,TransactionMT,TransactionDW,dollars,cents,P_parent_domain,P_domain_name,P_top_level_domain,card1_div_1000,card2_div_10,R_parent_domain,R_domain_name,R_top_level_domain,device_name,device_version,os_name,os_version
TransactionID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 100_level_1,Unnamed: 101_level_1,Unnamed: 102_level_1,Unnamed: 103_level_1,Unnamed: 104_level_1,Unnamed: 105_level_1,Unnamed: 106_level_1,Unnamed: 107_level_1,Unnamed: 108_level_1,Unnamed: 109_level_1,Unnamed: 110_level_1,Unnamed: 111_level_1,Unnamed: 112_level_1,Unnamed: 113_level_1,Unnamed: 114_level_1,Unnamed: 115_level_1,Unnamed: 116_level_1,Unnamed: 117_level_1,Unnamed: 118_level_1,Unnamed: 119_level_1,Unnamed: 120_level_1,Unnamed: 121_level_1,Unnamed: 122_level_1,Unnamed: 123_level_1,Unnamed: 124_level_1,Unnamed: 125_level_1,Unnamed: 126_level_1,Unnamed: 127_level_1,Unnamed: 128_level_1,Unnamed: 129_level_1,Unnamed: 130_level_1,Unnamed: 131_level_1,Unnamed: 132_level_1,Unnamed: 133_level_1,Unnamed: 134_level_1,Unnamed: 135_level_1,Unnamed: 136_level_1,Unnamed: 137_level_1,Unnamed: 138_level_1,Unnamed: 139_level_1,Unnamed: 140_level_1,Unnamed: 141_level_1,Unnamed: 142_level_1,Unnamed: 143_level_1,Unnamed: 144_level_1,Unnamed: 145_level_1,Unnamed: 146_level_1,Unnamed: 147_level_1,Unnamed: 148_level_1,Unnamed: 149_level_1,Unnamed: 150_level_1,Unnamed: 151_level_1,Unnamed: 152_level_1,Unnamed: 153_level_1,Unnamed: 154_level_1,Unnamed: 155_level_1,Unnamed: 156_level_1,Unnamed: 157_level_1,Unnamed: 158_level_1,Unnamed: 159_level_1,Unnamed: 160_level_1,Unnamed: 161_level_1,Unnamed: 162_level_1,Unnamed: 163_level_1,Unnamed: 164_level_1,Unnamed: 165_level_1,Unnamed: 166_level_1,Unnamed: 167_level_1,Unnamed: 168_level_1,Unnamed: 169_level_1,Unnamed: 170_level_1,Unnamed: 171_level_1,Unnamed: 172_level_1,Unnamed: 173_level_1,Unnamed: 174_level_1,Unnamed: 175_level_1,Unnamed: 176_level_1
2987000,0,86400,68.5,W,13926,,150.0,discover,142.0,credit,315.0,87.0,19.0,,,1.0,1.0,0.0,0.0,1.0,0.0,1.0,2.0,0.0,1.0,1.0,14.0,,13.0,,,,,,13.0,13.0,,,,0.0,T,T,T,M2,F,T,,,,1.0,1.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,,,,,,,,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,117.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1.0,1.0,0.0,1.0,0.0,117.0,0.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,0,0,5,68,5,,,,13,,,,,,,,
2987001,0,86401,29.0,W,2755,404.0,150.0,mastercard,102.0,credit,325.0,87.0,,gmail.com,,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,,,0.0,,,,,0.0,,,,,0.0,,,,M0,T,T,,,,,,,,,,0.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,0,0,5,29,0,google,gmail,com,2,40.0,,,,,,,
2987002,0,86469,59.0,W,4663,490.0,150.0,visa,166.0,debit,330.0,87.0,287.0,outlook.com,,1.0,1.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,,,0.0,,,,,0.0,315.0,,,,315.0,T,T,T,M0,F,F,F,F,F,1.0,1.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,0,1,5,59,0,microsoft,outlook,com,4,49.0,,,,,,,
2987003,0,86499,50.0,W,18132,567.0,150.0,mastercard,117.0,debit,476.0,87.0,,yahoo.com,,2.0,5.0,0.0,0.0,4.0,0.0,1.0,1.0,0.0,25.0,1.0,112.0,112.0,0.0,94.0,0.0,,,,84.0,,,,,111.0,,,,M0,T,F,,,,,,,,,,1.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,1.0,1.0,0.0,10.0,1758.0,354.0,135.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,1.0,0.0,1758.0,354.0,135.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,0,1,5,50,0,yahoo,yahoo,com,18,56.0,,,,,,,
2987004,0,86506,50.0,H,4497,514.0,150.0,mastercard,102.0,credit,420.0,87.0,,gmail.com,,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5155.0,2840.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,70787.0,,,,,,,100.0,NotFound,,New,NotFound,166.0,542.0,144.0,New,NotFound,Android 7.0,2220x1080,T,F,T,mobile,SAMSUNG SM-G892A Build/NRD90M,0,1,5,50,0,google,gmail,com,4,51.0,,,,Samsung,NRD90M,Android,7.0


In [10]:
catf, numf = cat_num_features(train_data)

# Data Prep

In [11]:
X_train = train_data.drop(['isFraud'], axis=1)
y_train = train_data['isFraud']

X_test = test_data

In [12]:
del train_data, test_data

In [13]:
# Storing Categorical and Numerical Feature Names 

catf, numf = cat_num_features(X_train)

In [14]:
# Encoding the Categorical Features

X_train[catf] = X_train[catf].fillna('missing')
X_test[catf] = X_test[catf].fillna('missing')

X_train, X_test = label_encode(X_train, X_test, catf)

In [15]:
X_train.head()

Unnamed: 0_level_0,TransactionDT,TransactionAmt,ProductCD,card1,card2,card3,card4,card5,card6,addr1,addr2,dist1,P_emaildomain,R_emaildomain,C1,C2,C4,C5,C6,C7,C9,C11,C12,C13,C14,D1,D2,D3,D4,D5,D6,D8,D9,D10,D11,D12,D13,D14,D15,M1,M2,M3,M4,M5,M6,M7,M8,M9,V1,V3,V4,V6,V8,V11,V13,V18,V20,V30,V36,V37,V40,V44,V47,V48,V52,V54,V60,V70,V76,V78,V80,V81,V82,V87,V91,V99,V127,V130,V131,V139,V147,V156,V165,V166,V169,V171,V173,V174,V175,V176,V180,V183,V185,V195,V198,V203,V205,V207,V209,V210,V215,V216,V220,V221,V223,V230,V234,V235,V238,V240,V241,V250,V252,V257,V258,V260,V262,V263,V264,V265,V268,V271,V274,V277,V282,V283,V289,V291,V303,V307,V310,V312,V315,id_01,id_02,id_03,id_04,id_05,id_06,id_09,id_10,id_11,id_12,id_13,id_15,id_16,id_17,id_19,id_20,id_28,id_29,id_30,id_33,id_35,id_36,id_37,DeviceType,DeviceInfo,TransactionHR,TransactionMT,TransactionDW,dollars,cents,P_parent_domain,P_domain_name,P_top_level_domain,card1_div_1000,card2_div_10,R_parent_domain,R_domain_name,R_top_level_domain,device_name,device_version,os_name,os_version
TransactionID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 100_level_1,Unnamed: 101_level_1,Unnamed: 102_level_1,Unnamed: 103_level_1,Unnamed: 104_level_1,Unnamed: 105_level_1,Unnamed: 106_level_1,Unnamed: 107_level_1,Unnamed: 108_level_1,Unnamed: 109_level_1,Unnamed: 110_level_1,Unnamed: 111_level_1,Unnamed: 112_level_1,Unnamed: 113_level_1,Unnamed: 114_level_1,Unnamed: 115_level_1,Unnamed: 116_level_1,Unnamed: 117_level_1,Unnamed: 118_level_1,Unnamed: 119_level_1,Unnamed: 120_level_1,Unnamed: 121_level_1,Unnamed: 122_level_1,Unnamed: 123_level_1,Unnamed: 124_level_1,Unnamed: 125_level_1,Unnamed: 126_level_1,Unnamed: 127_level_1,Unnamed: 128_level_1,Unnamed: 129_level_1,Unnamed: 130_level_1,Unnamed: 131_level_1,Unnamed: 132_level_1,Unnamed: 133_level_1,Unnamed: 134_level_1,Unnamed: 135_level_1,Unnamed: 136_level_1,Unnamed: 137_level_1,Unnamed: 138_level_1,Unnamed: 139_level_1,Unnamed: 140_level_1,Unnamed: 141_level_1,Unnamed: 142_level_1,Unnamed: 143_level_1,Unnamed: 144_level_1,Unnamed: 145_level_1,Unnamed: 146_level_1,Unnamed: 147_level_1,Unnamed: 148_level_1,Unnamed: 149_level_1,Unnamed: 150_level_1,Unnamed: 151_level_1,Unnamed: 152_level_1,Unnamed: 153_level_1,Unnamed: 154_level_1,Unnamed: 155_level_1,Unnamed: 156_level_1,Unnamed: 157_level_1,Unnamed: 158_level_1,Unnamed: 159_level_1,Unnamed: 160_level_1,Unnamed: 161_level_1,Unnamed: 162_level_1,Unnamed: 163_level_1,Unnamed: 164_level_1,Unnamed: 165_level_1,Unnamed: 166_level_1,Unnamed: 167_level_1,Unnamed: 168_level_1,Unnamed: 169_level_1,Unnamed: 170_level_1,Unnamed: 171_level_1,Unnamed: 172_level_1,Unnamed: 173_level_1,Unnamed: 174_level_1,Unnamed: 175_level_1
2987000,86400,68.5,4,3417,500,42,1,38,1,166,65,19.0,31,31,1.0,1.0,0.0,0.0,1.0,0.0,1.0,2.0,0.0,1.0,1.0,14.0,,13.0,,,,,,13.0,13.0,,,,0.0,1,1,1,2,0,1,2,2,2,1.0,1.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,,,,,,,,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,117.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1.0,1.0,0.0,1.0,0.0,117.0,0.0,0.0,0.0,,,,,,,,,,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,0,0,5,68,5,16,24,7,4,51,16,24,8,13,293,7,68
2987001,86401,29.0,4,7922,303,42,2,2,1,173,65,,16,31,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,,,0.0,,,,,0.0,,,,,0.0,2,2,2,0,1,1,2,2,2,,,,,,,0.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,,,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,0,0,5,29,0,12,15,2,10,30,16,24,8,13,293,7,68
2987002,86469,59.0,4,9383,389,42,4,58,2,178,65,287.0,36,31,1.0,1.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,,,0.0,,,,,0.0,315.0,,,,315.0,1,1,1,0,0,0,0,0,0,1.0,1.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,,,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,0,1,5,59,0,15,28,2,12,39,16,24,8,13,293,7,68
2987003,86499,50.0,4,6991,466,42,2,14,2,282,65,,54,31,2.0,5.0,0.0,0.0,4.0,0.0,1.0,1.0,0.0,25.0,1.0,112.0,112.0,0.0,94.0,0.0,,,,84.0,,,,,111.0,2,2,2,0,1,0,2,2,2,,,,,,,1.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,1.0,1.0,0.0,10.0,1758.0,354.0,135.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,1.0,0.0,1758.0,354.0,135.0,0.0,,,,,,,,,,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,0,1,5,50,0,30,43,2,9,46,16,24,8,13,293,7,68
2987004,86506,50.0,1,9262,413,42,2,2,1,241,65,,16,31,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,,,,,,,,,,,,,,2,2,2,3,2,2,2,2,2,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5155.0,2840.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,70787.0,,,,,,,100.0,1,54,1,1,59,400,32,1,1,7,164,1,0,1,2,954,0,1,5,50,0,12,15,2,12,41,16,24,8,7,249,0,58


## Filling NaN with -1s

In [16]:
X_train.fillna(-1, inplace=True)

In [17]:
X_test.fillna(-1, inplace=True)

In [18]:
# Save data for future use
X_train.to_pickle('train_clean_neg1.pkl')
X_test.to_pickle('test_clean_neg1.pkl')

## Imputing using KNN

In [72]:
%%time
train_data = pd.read_pickle('basic_fe_train.pkl')
test_data = pd.read_pickle('basic_fe_test.pkl')

CPU times: user 2.04 s, sys: 1.65 s, total: 3.69 s
Wall time: 4.43 s


In [73]:
X_train = train_data.drop(['isFraud'], axis=1)
y_train = train_data['isFraud']

X_test = test_data

In [74]:
# Encoding the Categorical Features

X_train[catf] = X_train[catf].fillna('missing')
X_test[catf] = X_test[catf].fillna('missing')

X_train, X_test = label_encode(X_train, X_test, catf)

In [75]:
catf, numf = cat_num_features(X_train)

In [76]:
train_sample_10k = X_train.iloc[:10000]
test_sample_10k = X_test.iloc[:10000]

In [77]:
train_sample_10k.head()

Unnamed: 0_level_0,TransactionDT,TransactionAmt,ProductCD,card1,card2,card3,card4,card5,card6,addr1,addr2,dist1,P_emaildomain,R_emaildomain,C1,C2,C4,C5,C6,C7,C9,C11,C12,C13,C14,D1,D2,D3,D4,D5,D6,D8,D9,D10,D11,D12,D13,D14,D15,M1,M2,M3,M4,M5,M6,M7,M8,M9,V1,V3,V4,V6,V8,V11,V13,V18,V20,V30,V36,V37,V40,V44,V47,V48,V52,V54,V60,V70,V76,V78,V80,V81,V82,V87,V91,V99,V127,V130,V131,V139,V147,V156,V165,V166,V169,V171,V173,V174,V175,V176,V180,V183,V185,V195,V198,V203,V205,V207,V209,V210,V215,V216,V220,V221,V223,V230,V234,V235,V238,V240,V241,V250,V252,V257,V258,V260,V262,V263,V264,V265,V268,V271,V274,V277,V282,V283,V289,V291,V303,V307,V310,V312,V315,id_01,id_02,id_03,id_04,id_05,id_06,id_09,id_10,id_11,id_12,id_13,id_15,id_16,id_17,id_19,id_20,id_28,id_29,id_30,id_33,id_35,id_36,id_37,DeviceType,DeviceInfo,TransactionHR,TransactionMT,TransactionDW,dollars,cents,card1_div_1000,card2_div_10,P_parent_domain,P_domain_name,P_top_level_domain,R_parent_domain,R_domain_name,R_top_level_domain,device_name,device_version,os_name,os_version
TransactionID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 100_level_1,Unnamed: 101_level_1,Unnamed: 102_level_1,Unnamed: 103_level_1,Unnamed: 104_level_1,Unnamed: 105_level_1,Unnamed: 106_level_1,Unnamed: 107_level_1,Unnamed: 108_level_1,Unnamed: 109_level_1,Unnamed: 110_level_1,Unnamed: 111_level_1,Unnamed: 112_level_1,Unnamed: 113_level_1,Unnamed: 114_level_1,Unnamed: 115_level_1,Unnamed: 116_level_1,Unnamed: 117_level_1,Unnamed: 118_level_1,Unnamed: 119_level_1,Unnamed: 120_level_1,Unnamed: 121_level_1,Unnamed: 122_level_1,Unnamed: 123_level_1,Unnamed: 124_level_1,Unnamed: 125_level_1,Unnamed: 126_level_1,Unnamed: 127_level_1,Unnamed: 128_level_1,Unnamed: 129_level_1,Unnamed: 130_level_1,Unnamed: 131_level_1,Unnamed: 132_level_1,Unnamed: 133_level_1,Unnamed: 134_level_1,Unnamed: 135_level_1,Unnamed: 136_level_1,Unnamed: 137_level_1,Unnamed: 138_level_1,Unnamed: 139_level_1,Unnamed: 140_level_1,Unnamed: 141_level_1,Unnamed: 142_level_1,Unnamed: 143_level_1,Unnamed: 144_level_1,Unnamed: 145_level_1,Unnamed: 146_level_1,Unnamed: 147_level_1,Unnamed: 148_level_1,Unnamed: 149_level_1,Unnamed: 150_level_1,Unnamed: 151_level_1,Unnamed: 152_level_1,Unnamed: 153_level_1,Unnamed: 154_level_1,Unnamed: 155_level_1,Unnamed: 156_level_1,Unnamed: 157_level_1,Unnamed: 158_level_1,Unnamed: 159_level_1,Unnamed: 160_level_1,Unnamed: 161_level_1,Unnamed: 162_level_1,Unnamed: 163_level_1,Unnamed: 164_level_1,Unnamed: 165_level_1,Unnamed: 166_level_1,Unnamed: 167_level_1,Unnamed: 168_level_1,Unnamed: 169_level_1,Unnamed: 170_level_1,Unnamed: 171_level_1,Unnamed: 172_level_1,Unnamed: 173_level_1,Unnamed: 174_level_1,Unnamed: 175_level_1
2987000,86400,68.5,4,3417,500,42,1,38,1,166,65,19.0,31,31,1.0,1.0,0.0,0.0,1.0,0.0,1.0,2.0,0.0,1.0,1.0,14.0,,13.0,,,,,,13.0,13.0,,,,0.0,1,1,1,2,0,1,2,2,2,1.0,1.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,,,,,,,,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,117.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1.0,1.0,0.0,1.0,0.0,117.0,0.0,0.0,0.0,,,,,,,,,,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,0,0,5,68,5,4,51,16,24,7,16,24,8,13,293,7,68
2987001,86401,29.0,4,7922,303,42,2,2,1,173,65,,16,31,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,,,0.0,,,,,0.0,,,,,0.0,2,2,2,0,1,1,2,2,2,,,,,,,0.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,,,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,0,0,5,29,0,10,30,12,15,2,16,24,8,13,293,7,68
2987002,86469,59.0,4,9383,389,42,4,58,2,178,65,287.0,36,31,1.0,1.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,,,0.0,,,,,0.0,315.0,,,,315.0,1,1,1,0,0,0,0,0,0,1.0,1.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,,,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,0,1,5,59,0,12,39,15,28,2,16,24,8,13,293,7,68
2987003,86499,50.0,4,6991,466,42,2,14,2,282,65,,54,31,2.0,5.0,0.0,0.0,4.0,0.0,1.0,1.0,0.0,25.0,1.0,112.0,112.0,0.0,94.0,0.0,,,,84.0,,,,,111.0,2,2,2,0,1,0,2,2,2,,,,,,,1.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,1.0,1.0,0.0,10.0,1758.0,354.0,135.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,1.0,0.0,1758.0,354.0,135.0,0.0,,,,,,,,,,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,0,1,5,50,0,9,46,30,43,2,16,24,8,13,293,7,68
2987004,86506,50.0,1,9262,413,42,2,2,1,241,65,,16,31,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,,,,,,,,,,,,,,2,2,2,3,2,2,2,2,2,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5155.0,2840.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,70787.0,,,,,,,100.0,1,54,1,1,59,400,32,1,1,7,164,1,0,1,2,954,0,1,5,50,0,12,41,12,15,2,16,24,8,7,249,0,58


In [78]:
test_sample_10k.head()

Unnamed: 0_level_0,TransactionDT,TransactionAmt,ProductCD,card1,card2,card3,card4,card5,card6,addr1,addr2,dist1,P_emaildomain,R_emaildomain,C1,C2,C4,C5,C6,C7,C9,C11,C12,C13,C14,D1,D2,D3,D4,D5,D6,D8,D9,D10,D11,D12,D13,D14,D15,M1,M2,M3,M4,M5,M6,M7,M8,M9,V1,V3,V4,V6,V8,V11,V13,V18,V20,V30,V36,V37,V40,V44,V47,V48,V52,V54,V60,V70,V76,V78,V80,V81,V82,V87,V91,V99,V127,V130,V131,V139,V147,V156,V165,V166,V169,V171,V173,V174,V175,V176,V180,V183,V185,V195,V198,V203,V205,V207,V209,V210,V215,V216,V220,V221,V223,V230,V234,V235,V238,V240,V241,V250,V252,V257,V258,V260,V262,V263,V264,V265,V268,V271,V274,V277,V282,V283,V289,V291,V303,V307,V310,V312,V315,id_01,id_02,id_03,id_04,id_05,id_06,id_09,id_10,id_11,id_12,id_13,id_15,id_16,id_17,id_19,id_20,id_28,id_29,id_30,id_33,id_35,id_36,id_37,DeviceType,DeviceInfo,TransactionHR,TransactionMT,TransactionDW,dollars,cents,card1_div_1000,card2_div_10,P_parent_domain,P_domain_name,P_top_level_domain,R_parent_domain,R_domain_name,R_top_level_domain,device_name,device_version,os_name,os_version
TransactionID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 100_level_1,Unnamed: 101_level_1,Unnamed: 102_level_1,Unnamed: 103_level_1,Unnamed: 104_level_1,Unnamed: 105_level_1,Unnamed: 106_level_1,Unnamed: 107_level_1,Unnamed: 108_level_1,Unnamed: 109_level_1,Unnamed: 110_level_1,Unnamed: 111_level_1,Unnamed: 112_level_1,Unnamed: 113_level_1,Unnamed: 114_level_1,Unnamed: 115_level_1,Unnamed: 116_level_1,Unnamed: 117_level_1,Unnamed: 118_level_1,Unnamed: 119_level_1,Unnamed: 120_level_1,Unnamed: 121_level_1,Unnamed: 122_level_1,Unnamed: 123_level_1,Unnamed: 124_level_1,Unnamed: 125_level_1,Unnamed: 126_level_1,Unnamed: 127_level_1,Unnamed: 128_level_1,Unnamed: 129_level_1,Unnamed: 130_level_1,Unnamed: 131_level_1,Unnamed: 132_level_1,Unnamed: 133_level_1,Unnamed: 134_level_1,Unnamed: 135_level_1,Unnamed: 136_level_1,Unnamed: 137_level_1,Unnamed: 138_level_1,Unnamed: 139_level_1,Unnamed: 140_level_1,Unnamed: 141_level_1,Unnamed: 142_level_1,Unnamed: 143_level_1,Unnamed: 144_level_1,Unnamed: 145_level_1,Unnamed: 146_level_1,Unnamed: 147_level_1,Unnamed: 148_level_1,Unnamed: 149_level_1,Unnamed: 150_level_1,Unnamed: 151_level_1,Unnamed: 152_level_1,Unnamed: 153_level_1,Unnamed: 154_level_1,Unnamed: 155_level_1,Unnamed: 156_level_1,Unnamed: 157_level_1,Unnamed: 158_level_1,Unnamed: 159_level_1,Unnamed: 160_level_1,Unnamed: 161_level_1,Unnamed: 162_level_1,Unnamed: 163_level_1,Unnamed: 164_level_1,Unnamed: 165_level_1,Unnamed: 166_level_1,Unnamed: 167_level_1,Unnamed: 168_level_1,Unnamed: 169_level_1,Unnamed: 170_level_1,Unnamed: 171_level_1,Unnamed: 172_level_1,Unnamed: 173_level_1,Unnamed: 174_level_1,Unnamed: 175_level_1
3663549,18403224,31.95,4,365,10,42,4,108,2,52,65,1.0,16,31,6.0,6.0,0.0,3.0,4.0,0.0,6.0,5.0,1.0,115.0,6.0,419.0,419.0,27.0,398.0,27.0,,,,418.0,203.0,,,,409.0,1,1,0,3,2,0,1,1,1,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,1.0,1.0,47.950001,47.950001,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,1.0,0.0,47.950001,47.950001,0.0,0.0,,,,,,,,,,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,0,0,0,31,95,1,1,12,15,2,16,24,8,13,293,7,68
3663550,18403263,49.0,4,9099,10,42,4,108,2,151,65,4.0,2,31,3.0,2.0,0.0,0.0,1.0,0.0,2.0,1.0,1.0,12.0,2.0,149.0,149.0,7.0,634.0,7.0,,,,231.0,634.0,,,,634.0,1,0,0,0,2,0,2,2,2,1.0,1.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,1.0,1.0,0.0,4.0,280.0,280.0,77.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,1.0,0.0,280.0,280.0,77.0,0.0,,,,,,,,,,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,0,1,0,49,0,12,1,2,2,2,16,24,8,13,293,7,68
3663551,18403310,171.0,4,9245,473,42,4,108,2,280,65,2635.0,19,31,2.0,2.0,0.0,0.0,5.0,0.0,4.0,2.0,0.0,22.0,2.0,137.0,137.0,10.0,97.0,10.0,,,,136.0,136.0,,,,97.0,1,1,0,0,0,0,0,0,0,1.0,1.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,2.0,2.0,0.0,0.0,1.0,1.0,0.0,3.0,968.0,705.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,2.0,0.0,1321.0,1058.0,0.0,0.0,,,,,,,,,,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,0,1,0,171,0,12,47,15,17,2,16,24,8,13,293,7,68
3663552,18403310,284.95,4,870,259,42,4,58,2,79,65,17.0,16,31,5.0,2.0,0.0,1.0,1.0,0.0,2.0,2.0,0.0,7.0,4.0,42.0,42.0,41.0,242.0,41.0,,,,242.0,242.0,,,,242.0,1,1,1,3,2,1,2,2,2,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,1.0,1.0,2.0,2.0,0.0,2.0,2.0,1.0,0.0,1.0,0.0,1.0,1.0,1.0,0.0,0.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,282.540009,,,,,,,,,,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,0,1,0,284,95,1,26,12,15,2,16,24,8,13,293,7,68
3663553,18403317,67.95,4,6894,351,42,2,14,2,127,65,6.0,16,31,6.0,6.0,0.0,2.0,5.0,0.0,5.0,6.0,0.0,14.0,6.0,22.0,22.0,0.0,22.0,0.0,,,,22.0,22.0,,,,22.0,1,1,1,3,2,0,0,1,1,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,1.0,1.0,1.0,1.0,0.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,1.0,1.0,0.0,0.0,1.0,1.0,1.0,3.0,183.850006,183.850006,67.949997,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1.0,1.0,1.0,1.0,0.0,183.850006,183.850006,67.949997,67.949997,,,,,,,,,,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,0,1,0,67,95,9,35,12,15,2,16,24,8,13,293,7,68


In [38]:
knn2 = KNNImputer(n_neighbors=2)

In [39]:
knn2.fit(train_sample_10k[numf])

In [79]:
knn2_test = KNNImputer(n_neighbors=2)

In [80]:
knn2_test.fit(test_sample_10k[numf])

In [40]:
train_sample_10k[numf] = knn2.transform(train_sample_10k[numf])

In [41]:
train_sample_10k[numf].head()

Unnamed: 0_level_0,TransactionDT,TransactionAmt,dist1,C1,C2,C4,C5,C6,C7,C9,C11,C12,C13,C14,D1,D2,D3,D4,D5,D6,D8,D9,D10,D11,D12,D13,D14,D15,V1,V3,V4,V6,V8,V11,V13,V18,V20,V30,V36,V37,V40,V44,V47,V48,V52,V54,V60,V70,V76,V78,V80,V81,V82,V87,V91,V99,V127,V130,V131,V139,V147,V156,V165,V166,V169,V171,V173,V174,V175,V176,V180,V183,V185,V195,V198,V203,V205,V207,V209,V210,V215,V216,V220,V221,V223,V230,V234,V235,V238,V240,V241,V250,V252,V257,V258,V260,V262,V263,V264,V265,V268,V271,V274,V277,V282,V283,V289,V291,V303,V307,V310,V312,V315,id_01,id_02,id_03,id_04,id_05,id_06,id_09,id_10,id_11,TransactionHR,TransactionMT,dollars,cents
TransactionID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 100_level_1,Unnamed: 101_level_1,Unnamed: 102_level_1,Unnamed: 103_level_1,Unnamed: 104_level_1,Unnamed: 105_level_1,Unnamed: 106_level_1,Unnamed: 107_level_1,Unnamed: 108_level_1,Unnamed: 109_level_1,Unnamed: 110_level_1,Unnamed: 111_level_1,Unnamed: 112_level_1,Unnamed: 113_level_1,Unnamed: 114_level_1,Unnamed: 115_level_1,Unnamed: 116_level_1,Unnamed: 117_level_1,Unnamed: 118_level_1,Unnamed: 119_level_1,Unnamed: 120_level_1,Unnamed: 121_level_1,Unnamed: 122_level_1,Unnamed: 123_level_1,Unnamed: 124_level_1,Unnamed: 125_level_1,Unnamed: 126_level_1
2987000,86400.0,68.5,19.0,1.0,1.0,0.0,0.0,1.0,0.0,1.0,2.0,0.0,1.0,1.0,14.0,59.0,13.0,0.0,10.5,0.0,23.5,0.0,13.0,13.0,0.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,0.5,1.0,0.0,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,117.0,0.0,0.0,0.0,0.0,0.0,5155.0,2840.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,0.0,117.0,0.0,0.0,0.0,-2.5,84866.0,1.5,0.0,0.5,-2.5,1.5,0.0,100.0,0.0,0.0,68.0,5.0
2987001,86401.0,29.0,27.5,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,59.0,12.0,0.0,10.5,0.0,23.5,0.0,0.0,6.5,0.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5155.0,2840.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,-2.5,84866.0,1.5,0.0,0.5,-2.5,1.5,0.0,100.0,0.0,0.0,29.0,0.0
2987002,86469.0,59.0,287.0,1.0,1.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,59.0,10.5,0.0,10.5,0.0,23.5,0.0,0.0,315.0,0.0,0.0,0.0,315.0,1.0,1.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5155.0,2840.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,-2.5,84866.0,1.5,0.0,0.5,-2.5,1.5,0.0,100.0,0.0,1.0,59.0,0.0
2987003,86499.0,50.0,68.5,2.0,5.0,0.0,0.0,4.0,0.0,1.0,1.0,0.0,25.0,1.0,112.0,112.0,0.0,94.0,0.0,0.0,83.0,0.0,84.0,19.5,0.0,0.0,0.0,111.0,1.0,1.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,1.0,1.0,0.0,10.0,1758.0,354.0,135.0,0.0,0.0,0.0,2577.5,1370.0,1.5,2.5,0.5,1.0,1.0,2.5,0.5,0.5,0.5,1.0,1.0,83.107697,45.163952,45.163952,45.163952,45.163952,37.943748,37.943748,1.5,2.5,1.0,2.5,0.5,0.5,0.5,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,83.107697,83.107697,83.107697,45.163952,45.163952,0.0,37.943748,0.0,0.0,0.0,1.0,0.0,1758.0,354.0,135.0,0.0,-5.0,206731.5,0.0,0.0,0.0,-3.0,0.0,0.0,100.0,0.0,1.0,50.0,0.0
2987004,86506.0,50.0,161.5,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,66.5,20.5,0.0,20.5,17.5,110.0,0.0,0.0,157.5,17.5,159.5,0.0,157.5,1.0,1.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5155.0,2840.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,70787.0,0.0,0.0,0.5,-0.5,0.5,0.0,100.0,0.0,1.0,50.0,0.0


In [42]:
X_train[numf] = knn2.transform(X_train[numf])
X_train.to_pickle('train_clean_knn2.pkl')

In [43]:
X_train.head()

Unnamed: 0_level_0,TransactionDT,TransactionAmt,ProductCD,card1,card2,card3,card4,card5,card6,addr1,addr2,dist1,P_emaildomain,R_emaildomain,C1,C2,C4,C5,C6,C7,C9,C11,C12,C13,C14,D1,D2,D3,D4,D5,D6,D8,D9,D10,D11,D12,D13,D14,D15,M1,M2,M3,M4,M5,M6,M7,M8,M9,V1,V3,V4,V6,V8,V11,V13,V18,V20,V30,V36,V37,V40,V44,V47,V48,V52,V54,V60,V70,V76,V78,V80,V81,V82,V87,V91,V99,V127,V130,V131,V139,V147,V156,V165,V166,V169,V171,V173,V174,V175,V176,V180,V183,V185,V195,V198,V203,V205,V207,V209,V210,V215,V216,V220,V221,V223,V230,V234,V235,V238,V240,V241,V250,V252,V257,V258,V260,V262,V263,V264,V265,V268,V271,V274,V277,V282,V283,V289,V291,V303,V307,V310,V312,V315,id_01,id_02,id_03,id_04,id_05,id_06,id_09,id_10,id_11,id_12,id_13,id_15,id_16,id_17,id_19,id_20,id_28,id_29,id_30,id_33,id_35,id_36,id_37,DeviceType,DeviceInfo,TransactionHR,TransactionMT,TransactionDW,dollars,cents,P_parent_domain,P_domain_name,P_top_level_domain,card1_div_1000,card2_div_10,R_parent_domain,R_domain_name,R_top_level_domain,device_name,device_version,os_name,os_version
TransactionID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 100_level_1,Unnamed: 101_level_1,Unnamed: 102_level_1,Unnamed: 103_level_1,Unnamed: 104_level_1,Unnamed: 105_level_1,Unnamed: 106_level_1,Unnamed: 107_level_1,Unnamed: 108_level_1,Unnamed: 109_level_1,Unnamed: 110_level_1,Unnamed: 111_level_1,Unnamed: 112_level_1,Unnamed: 113_level_1,Unnamed: 114_level_1,Unnamed: 115_level_1,Unnamed: 116_level_1,Unnamed: 117_level_1,Unnamed: 118_level_1,Unnamed: 119_level_1,Unnamed: 120_level_1,Unnamed: 121_level_1,Unnamed: 122_level_1,Unnamed: 123_level_1,Unnamed: 124_level_1,Unnamed: 125_level_1,Unnamed: 126_level_1,Unnamed: 127_level_1,Unnamed: 128_level_1,Unnamed: 129_level_1,Unnamed: 130_level_1,Unnamed: 131_level_1,Unnamed: 132_level_1,Unnamed: 133_level_1,Unnamed: 134_level_1,Unnamed: 135_level_1,Unnamed: 136_level_1,Unnamed: 137_level_1,Unnamed: 138_level_1,Unnamed: 139_level_1,Unnamed: 140_level_1,Unnamed: 141_level_1,Unnamed: 142_level_1,Unnamed: 143_level_1,Unnamed: 144_level_1,Unnamed: 145_level_1,Unnamed: 146_level_1,Unnamed: 147_level_1,Unnamed: 148_level_1,Unnamed: 149_level_1,Unnamed: 150_level_1,Unnamed: 151_level_1,Unnamed: 152_level_1,Unnamed: 153_level_1,Unnamed: 154_level_1,Unnamed: 155_level_1,Unnamed: 156_level_1,Unnamed: 157_level_1,Unnamed: 158_level_1,Unnamed: 159_level_1,Unnamed: 160_level_1,Unnamed: 161_level_1,Unnamed: 162_level_1,Unnamed: 163_level_1,Unnamed: 164_level_1,Unnamed: 165_level_1,Unnamed: 166_level_1,Unnamed: 167_level_1,Unnamed: 168_level_1,Unnamed: 169_level_1,Unnamed: 170_level_1,Unnamed: 171_level_1,Unnamed: 172_level_1,Unnamed: 173_level_1,Unnamed: 174_level_1,Unnamed: 175_level_1
2987000,86400.0,68.5,4,3417,500,42,1,38,1,166,65,19.0,31,31,1.0,1.0,0.0,0.0,1.0,0.0,1.0,2.0,0.0,1.0,1.0,14.0,59.0,13.0,0.0,10.5,0.0,23.5,0.0,13.0,13.0,0.0,0.0,0.0,0.0,1,1,1,2,0,1,2,2,2,1.0,1.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,0.5,1.0,0.0,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,117.0,0.0,0.0,0.0,0.0,0.0,5155.0,2840.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,0.0,117.0,0.0,0.0,0.0,-2.5,84866.0,1.5,0.0,0.5,-2.5,1.5,0.0,100.0,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,0.0,0.0,5,68.0,5.0,16,24,7,4,51,16,24,8,13,293,7,68
2987001,86401.0,29.0,4,7922,303,42,2,2,1,173,65,27.5,16,31,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,59.0,12.0,0.0,10.5,0.0,23.5,0.0,0.0,6.5,0.0,0.0,0.0,0.0,2,2,2,0,1,1,2,2,2,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5155.0,2840.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,-2.5,84866.0,1.5,0.0,0.5,-2.5,1.5,0.0,100.0,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,0.0,0.0,5,29.0,0.0,12,15,2,10,30,16,24,8,13,293,7,68
2987002,86469.0,59.0,4,9383,389,42,4,58,2,178,65,287.0,36,31,1.0,1.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,59.0,10.5,0.0,10.5,0.0,23.5,0.0,0.0,315.0,0.0,0.0,0.0,315.0,1,1,1,0,0,0,0,0,0,1.0,1.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5155.0,2840.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,-2.5,84866.0,1.5,0.0,0.5,-2.5,1.5,0.0,100.0,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,0.0,1.0,5,59.0,0.0,15,28,2,12,39,16,24,8,13,293,7,68
2987003,86499.0,50.0,4,6991,466,42,2,14,2,282,65,68.5,54,31,2.0,5.0,0.0,0.0,4.0,0.0,1.0,1.0,0.0,25.0,1.0,112.0,112.0,0.0,94.0,0.0,0.0,83.0,0.0,84.0,19.5,0.0,0.0,0.0,111.0,2,2,2,0,1,0,2,2,2,1.0,1.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,1.0,1.0,0.0,10.0,1758.0,354.0,135.0,0.0,0.0,0.0,2577.5,1370.0,1.5,2.5,0.5,1.0,1.0,2.5,0.5,0.5,0.5,1.0,1.0,83.107697,45.163952,45.163952,45.163952,45.163952,37.943748,37.943748,1.5,2.5,1.0,2.5,0.5,0.5,0.5,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,83.107697,83.107697,83.107697,45.163952,45.163952,0.0,37.943748,0.0,0.0,0.0,1.0,0.0,1758.0,354.0,135.0,0.0,-5.0,206731.5,0.0,0.0,0.0,-3.0,0.0,0.0,100.0,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,0.0,1.0,5,50.0,0.0,30,43,2,9,46,16,24,8,13,293,7,68
2987004,86506.0,50.0,1,9262,413,42,2,2,1,241,65,161.5,16,31,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,66.5,20.5,0.0,20.5,17.5,110.0,0.0,0.0,157.5,17.5,159.5,0.0,157.5,2,2,2,3,2,2,2,2,2,1.0,1.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5155.0,2840.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,70787.0,0.0,0.0,0.5,-0.5,0.5,0.0,100.0,1,54,1,1,59,400,32,1,1,7,164,1,0,1,2,954,0.0,1.0,5,50.0,0.0,12,15,2,12,41,16,24,8,7,249,0,58


In [45]:
train_data = pd.concat([X_train, y_train], axis=1)

In [46]:
train_data.shape

(590540, 176)

In [49]:
train_data.to_pickle('train_clean_knn2.pkl')

In [81]:
X_test.shape

(506691, 175)

In [84]:
X_test[numf] = knn2_test.transform(X_test[numf])
X_test.to_pickle('test_clean_knn2.pkl')

In [85]:
X_test.head()

Unnamed: 0_level_0,TransactionDT,TransactionAmt,ProductCD,card1,card2,card3,card4,card5,card6,addr1,addr2,dist1,P_emaildomain,R_emaildomain,C1,C2,C4,C5,C6,C7,C9,C11,C12,C13,C14,D1,D2,D3,D4,D5,D6,D8,D9,D10,D11,D12,D13,D14,D15,M1,M2,M3,M4,M5,M6,M7,M8,M9,V1,V3,V4,V6,V8,V11,V13,V18,V20,V30,V36,V37,V40,V44,V47,V48,V52,V54,V60,V70,V76,V78,V80,V81,V82,V87,V91,V99,V127,V130,V131,V139,V147,V156,V165,V166,V169,V171,V173,V174,V175,V176,V180,V183,V185,V195,V198,V203,V205,V207,V209,V210,V215,V216,V220,V221,V223,V230,V234,V235,V238,V240,V241,V250,V252,V257,V258,V260,V262,V263,V264,V265,V268,V271,V274,V277,V282,V283,V289,V291,V303,V307,V310,V312,V315,id_01,id_02,id_03,id_04,id_05,id_06,id_09,id_10,id_11,id_12,id_13,id_15,id_16,id_17,id_19,id_20,id_28,id_29,id_30,id_33,id_35,id_36,id_37,DeviceType,DeviceInfo,TransactionHR,TransactionMT,TransactionDW,dollars,cents,card1_div_1000,card2_div_10,P_parent_domain,P_domain_name,P_top_level_domain,R_parent_domain,R_domain_name,R_top_level_domain,device_name,device_version,os_name,os_version
TransactionID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 100_level_1,Unnamed: 101_level_1,Unnamed: 102_level_1,Unnamed: 103_level_1,Unnamed: 104_level_1,Unnamed: 105_level_1,Unnamed: 106_level_1,Unnamed: 107_level_1,Unnamed: 108_level_1,Unnamed: 109_level_1,Unnamed: 110_level_1,Unnamed: 111_level_1,Unnamed: 112_level_1,Unnamed: 113_level_1,Unnamed: 114_level_1,Unnamed: 115_level_1,Unnamed: 116_level_1,Unnamed: 117_level_1,Unnamed: 118_level_1,Unnamed: 119_level_1,Unnamed: 120_level_1,Unnamed: 121_level_1,Unnamed: 122_level_1,Unnamed: 123_level_1,Unnamed: 124_level_1,Unnamed: 125_level_1,Unnamed: 126_level_1,Unnamed: 127_level_1,Unnamed: 128_level_1,Unnamed: 129_level_1,Unnamed: 130_level_1,Unnamed: 131_level_1,Unnamed: 132_level_1,Unnamed: 133_level_1,Unnamed: 134_level_1,Unnamed: 135_level_1,Unnamed: 136_level_1,Unnamed: 137_level_1,Unnamed: 138_level_1,Unnamed: 139_level_1,Unnamed: 140_level_1,Unnamed: 141_level_1,Unnamed: 142_level_1,Unnamed: 143_level_1,Unnamed: 144_level_1,Unnamed: 145_level_1,Unnamed: 146_level_1,Unnamed: 147_level_1,Unnamed: 148_level_1,Unnamed: 149_level_1,Unnamed: 150_level_1,Unnamed: 151_level_1,Unnamed: 152_level_1,Unnamed: 153_level_1,Unnamed: 154_level_1,Unnamed: 155_level_1,Unnamed: 156_level_1,Unnamed: 157_level_1,Unnamed: 158_level_1,Unnamed: 159_level_1,Unnamed: 160_level_1,Unnamed: 161_level_1,Unnamed: 162_level_1,Unnamed: 163_level_1,Unnamed: 164_level_1,Unnamed: 165_level_1,Unnamed: 166_level_1,Unnamed: 167_level_1,Unnamed: 168_level_1,Unnamed: 169_level_1,Unnamed: 170_level_1,Unnamed: 171_level_1,Unnamed: 172_level_1,Unnamed: 173_level_1,Unnamed: 174_level_1,Unnamed: 175_level_1
3663549,18403224.0,31.95,4,365,10,42,4,108,2,52,65,1.0,16,31,6.0,6.0,0.0,3.0,4.0,0.0,6.0,5.0,1.0,115.0,6.0,419.0,419.0,27.0,398.0,27.0,317.0,11.0,0.0,418.0,203.0,0.0,0.0,0.0,409.0,1,1,0,3,2,0,1,1,1,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,1.0,1.0,47.950001,47.950001,0.0,0.5,0.0,0.5,0.0,0.0,0.0,1.0,0.0,0.5,0.5,1.0,0.0,0.0,0.0,1.0,1.0,20.0,0.0,0.0,20.0,20.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,47.950001,47.950001,0.0,0.0,-22.5,141934.5,0.0,0.0,0.0,0.0,0.0,0.0,100.0,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,0.0,0.0,0,31.0,95.0,1,1,12,15,2,16,24,8,13,293,7,68
3663550,18403263.0,49.0,4,9099,10,42,4,108,2,151,65,4.0,2,31,3.0,2.0,0.0,0.0,1.0,0.0,2.0,1.0,1.0,12.0,2.0,149.0,149.0,7.0,634.0,7.0,317.0,11.0,0.0,231.0,634.0,283.5,0.0,0.0,634.0,1,0,0,0,2,0,2,2,2,1.0,1.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,1.0,1.0,0.0,4.0,280.0,280.0,77.0,0.5,0.0,0.5,0.0,0.0,0.0,1.0,0.0,0.5,0.5,1.0,0.0,0.0,0.0,1.0,1.0,20.0,0.0,0.0,20.0,20.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,280.0,280.0,77.0,0.0,-22.5,141934.5,0.0,0.0,0.0,0.0,0.0,0.0,100.0,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,0.0,1.0,0,49.0,0.0,12,1,2,2,2,16,24,8,13,293,7,68
3663551,18403310.0,171.0,4,9245,473,42,4,108,2,280,65,2635.0,19,31,2.0,2.0,0.0,0.0,5.0,0.0,4.0,2.0,0.0,22.0,2.0,137.0,137.0,10.0,97.0,10.0,317.0,11.0,0.0,136.0,136.0,0.0,0.0,0.0,97.0,1,1,0,0,0,0,0,0,0,1.0,1.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,2.0,2.0,0.0,0.0,1.0,1.0,0.0,3.0,968.0,705.0,0.0,1.5,0.0,0.5,50.0,0.0,0.0,1.0,0.0,0.5,0.5,1.0,0.0,0.0,0.0,1.0,1.0,20.0,0.0,0.0,20.0,20.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,1321.0,1058.0,0.0,0.0,-22.5,141934.5,0.0,0.0,0.0,0.0,0.0,0.0,100.0,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,0.0,1.0,0,171.0,0.0,12,47,15,17,2,16,24,8,13,293,7,68
3663552,18403310.0,284.95,4,870,259,42,4,58,2,79,65,17.0,16,31,5.0,2.0,0.0,1.0,1.0,0.0,2.0,2.0,0.0,7.0,4.0,42.0,42.0,41.0,242.0,41.0,0.0,11.0,0.0,242.0,242.0,0.0,0.0,0.0,242.0,1,1,1,3,2,1,2,2,2,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,1.0,1.0,2.0,2.0,0.0,2.0,2.0,1.0,0.0,1.0,0.0,1.0,1.0,1.0,0.0,0.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.5,0.0,0.5,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,282.540009,-25.0,232750.0,0.0,0.0,0.5,0.0,0.0,0.0,100.0,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,0.0,1.0,0,284.0,95.0,1,26,12,15,2,16,24,8,13,293,7,68
3663553,18403317.0,67.95,4,6894,351,42,2,14,2,127,65,6.0,16,31,6.0,6.0,0.0,2.0,5.0,0.0,5.0,6.0,0.0,14.0,6.0,22.0,22.0,0.0,22.0,0.0,0.0,11.0,0.0,22.0,22.0,0.0,0.0,0.0,22.0,1,1,1,3,2,0,0,1,1,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,1.0,1.0,1.0,1.0,0.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,1.0,1.0,0.0,0.0,1.0,1.0,1.0,3.0,183.850006,183.850006,67.949997,0.5,0.0,0.5,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,0.0,183.850006,183.850006,67.949997,67.949997,-25.0,232750.0,0.0,0.0,0.5,0.0,0.0,0.0,100.0,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,0.0,1.0,0,67.0,95.0,9,35,12,15,2,16,24,8,13,293,7,68


In [None]:
X_test.isna().sum()

In [87]:
X_test.to_pickle('test_clean_knn2.pkl')

## Scaling Numf

In [4]:
train_data = pd.read_pickle('train_clean_knn2.pkl')
test_data = pd.read_pickle('test_clean_knn2.pkl')

In [6]:
train_data.head()

Unnamed: 0_level_0,TransactionDT,TransactionAmt,ProductCD,card1,card2,card3,card4,card5,card6,addr1,addr2,dist1,P_emaildomain,R_emaildomain,C1,C2,C4,C5,C6,C7,C9,C11,C12,C13,C14,D1,D2,D3,D4,D5,D6,D8,D9,D10,D11,D12,D13,D14,D15,M1,M2,M3,M4,M5,M6,M7,M8,M9,V1,V3,V4,V6,V8,V11,V13,V18,V20,V30,V36,V37,V40,V44,V47,V48,V52,V54,V60,V70,V76,V78,V80,V81,V82,V87,V91,V99,V127,V130,V131,V139,V147,V156,V165,V166,V169,V171,V173,V174,V175,V176,V180,V183,V185,V195,V198,V203,V205,V207,V209,V210,V215,V216,V220,V221,V223,V230,V234,V235,V238,V240,V241,V250,V252,V257,V258,V260,V262,V263,V264,V265,V268,V271,V274,V277,V282,V283,V289,V291,V303,V307,V310,V312,V315,id_01,id_02,id_03,id_04,id_05,id_06,id_09,id_10,id_11,id_12,id_13,id_15,id_16,id_17,id_19,id_20,id_28,id_29,id_30,id_33,id_35,id_36,id_37,DeviceType,DeviceInfo,TransactionHR,TransactionMT,TransactionDW,dollars,cents,P_parent_domain,P_domain_name,P_top_level_domain,card1_div_1000,card2_div_10,R_parent_domain,R_domain_name,R_top_level_domain,device_name,device_version,os_name,os_version,isFraud
TransactionID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 100_level_1,Unnamed: 101_level_1,Unnamed: 102_level_1,Unnamed: 103_level_1,Unnamed: 104_level_1,Unnamed: 105_level_1,Unnamed: 106_level_1,Unnamed: 107_level_1,Unnamed: 108_level_1,Unnamed: 109_level_1,Unnamed: 110_level_1,Unnamed: 111_level_1,Unnamed: 112_level_1,Unnamed: 113_level_1,Unnamed: 114_level_1,Unnamed: 115_level_1,Unnamed: 116_level_1,Unnamed: 117_level_1,Unnamed: 118_level_1,Unnamed: 119_level_1,Unnamed: 120_level_1,Unnamed: 121_level_1,Unnamed: 122_level_1,Unnamed: 123_level_1,Unnamed: 124_level_1,Unnamed: 125_level_1,Unnamed: 126_level_1,Unnamed: 127_level_1,Unnamed: 128_level_1,Unnamed: 129_level_1,Unnamed: 130_level_1,Unnamed: 131_level_1,Unnamed: 132_level_1,Unnamed: 133_level_1,Unnamed: 134_level_1,Unnamed: 135_level_1,Unnamed: 136_level_1,Unnamed: 137_level_1,Unnamed: 138_level_1,Unnamed: 139_level_1,Unnamed: 140_level_1,Unnamed: 141_level_1,Unnamed: 142_level_1,Unnamed: 143_level_1,Unnamed: 144_level_1,Unnamed: 145_level_1,Unnamed: 146_level_1,Unnamed: 147_level_1,Unnamed: 148_level_1,Unnamed: 149_level_1,Unnamed: 150_level_1,Unnamed: 151_level_1,Unnamed: 152_level_1,Unnamed: 153_level_1,Unnamed: 154_level_1,Unnamed: 155_level_1,Unnamed: 156_level_1,Unnamed: 157_level_1,Unnamed: 158_level_1,Unnamed: 159_level_1,Unnamed: 160_level_1,Unnamed: 161_level_1,Unnamed: 162_level_1,Unnamed: 163_level_1,Unnamed: 164_level_1,Unnamed: 165_level_1,Unnamed: 166_level_1,Unnamed: 167_level_1,Unnamed: 168_level_1,Unnamed: 169_level_1,Unnamed: 170_level_1,Unnamed: 171_level_1,Unnamed: 172_level_1,Unnamed: 173_level_1,Unnamed: 174_level_1,Unnamed: 175_level_1,Unnamed: 176_level_1
2987000,86400.0,68.5,4,3417,500,42,1,38,1,166,65,19.0,31,31,1.0,1.0,0.0,0.0,1.0,0.0,1.0,2.0,0.0,1.0,1.0,14.0,59.0,13.0,0.0,10.5,0.0,23.5,0.0,13.0,13.0,0.0,0.0,0.0,0.0,1,1,1,2,0,1,2,2,2,1.0,1.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,0.5,1.0,0.0,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,117.0,0.0,0.0,0.0,0.0,0.0,5155.0,2840.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,0.0,117.0,0.0,0.0,0.0,-2.5,84866.0,1.5,0.0,0.5,-2.5,1.5,0.0,100.0,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,0.0,0.0,5,68.0,5.0,16,24,7,4,51,16,24,8,13,293,7,68,0
2987001,86401.0,29.0,4,7922,303,42,2,2,1,173,65,27.5,16,31,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,59.0,12.0,0.0,10.5,0.0,23.5,0.0,0.0,6.5,0.0,0.0,0.0,0.0,2,2,2,0,1,1,2,2,2,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5155.0,2840.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,-2.5,84866.0,1.5,0.0,0.5,-2.5,1.5,0.0,100.0,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,0.0,0.0,5,29.0,0.0,12,15,2,10,30,16,24,8,13,293,7,68,0
2987002,86469.0,59.0,4,9383,389,42,4,58,2,178,65,287.0,36,31,1.0,1.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,59.0,10.5,0.0,10.5,0.0,23.5,0.0,0.0,315.0,0.0,0.0,0.0,315.0,1,1,1,0,0,0,0,0,0,1.0,1.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5155.0,2840.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,-2.5,84866.0,1.5,0.0,0.5,-2.5,1.5,0.0,100.0,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,0.0,1.0,5,59.0,0.0,15,28,2,12,39,16,24,8,13,293,7,68,0
2987003,86499.0,50.0,4,6991,466,42,2,14,2,282,65,68.5,54,31,2.0,5.0,0.0,0.0,4.0,0.0,1.0,1.0,0.0,25.0,1.0,112.0,112.0,0.0,94.0,0.0,0.0,83.0,0.0,84.0,19.5,0.0,0.0,0.0,111.0,2,2,2,0,1,0,2,2,2,1.0,1.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,1.0,1.0,0.0,10.0,1758.0,354.0,135.0,0.0,0.0,0.0,2577.5,1370.0,1.5,2.5,0.5,1.0,1.0,2.5,0.5,0.5,0.5,1.0,1.0,83.107697,45.163952,45.163952,45.163952,45.163952,37.943748,37.943748,1.5,2.5,1.0,2.5,0.5,0.5,0.5,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,83.107697,83.107697,83.107697,45.163952,45.163952,0.0,37.943748,0.0,0.0,0.0,1.0,0.0,1758.0,354.0,135.0,0.0,-5.0,206731.5,0.0,0.0,0.0,-3.0,0.0,0.0,100.0,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,0.0,1.0,5,50.0,0.0,30,43,2,9,46,16,24,8,13,293,7,68,0
2987004,86506.0,50.0,1,9262,413,42,2,2,1,241,65,161.5,16,31,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,66.5,20.5,0.0,20.5,17.5,110.0,0.0,0.0,157.5,17.5,159.5,0.0,157.5,2,2,2,3,2,2,2,2,2,1.0,1.0,1.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5155.0,2840.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,70787.0,0.0,0.0,0.5,-0.5,0.5,0.0,100.0,1,54,1,1,59,400,32,1,1,7,164,1,0,1,2,954,0.0,1.0,5,50.0,0.0,12,15,2,12,41,16,24,8,7,249,0,58,0


In [5]:
catf, numf = cat_num_features(train_data)

In [8]:
from sklearn.preprocessing import StandardScaler

In [9]:
scaler = StandardScaler()

scaler.fit(train_data[numf])

In [10]:
train_data[numf] = scaler.transform(train_data[numf])
test_data[numf] = scaler.transform(test_data[numf])

In [11]:
train_data.head()

Unnamed: 0_level_0,TransactionDT,TransactionAmt,ProductCD,card1,card2,card3,card4,card5,card6,addr1,addr2,dist1,P_emaildomain,R_emaildomain,C1,C2,C4,C5,C6,C7,C9,C11,C12,C13,C14,D1,D2,D3,D4,D5,D6,D8,D9,D10,D11,D12,D13,D14,D15,M1,M2,M3,M4,M5,M6,M7,M8,M9,V1,V3,V4,V6,V8,V11,V13,V18,V20,V30,V36,V37,V40,V44,V47,V48,V52,V54,V60,V70,V76,V78,V80,V81,V82,V87,V91,V99,V127,V130,V131,V139,V147,V156,V165,V166,V169,V171,V173,V174,V175,V176,V180,V183,V185,V195,V198,V203,V205,V207,V209,V210,V215,V216,V220,V221,V223,V230,V234,V235,V238,V240,V241,V250,V252,V257,V258,V260,V262,V263,V264,V265,V268,V271,V274,V277,V282,V283,V289,V291,V303,V307,V310,V312,V315,id_01,id_02,id_03,id_04,id_05,id_06,id_09,id_10,id_11,id_12,id_13,id_15,id_16,id_17,id_19,id_20,id_28,id_29,id_30,id_33,id_35,id_36,id_37,DeviceType,DeviceInfo,TransactionHR,TransactionMT,TransactionDW,dollars,cents,P_parent_domain,P_domain_name,P_top_level_domain,card1_div_1000,card2_div_10,R_parent_domain,R_domain_name,R_top_level_domain,device_name,device_version,os_name,os_version,isFraud
TransactionID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 100_level_1,Unnamed: 101_level_1,Unnamed: 102_level_1,Unnamed: 103_level_1,Unnamed: 104_level_1,Unnamed: 105_level_1,Unnamed: 106_level_1,Unnamed: 107_level_1,Unnamed: 108_level_1,Unnamed: 109_level_1,Unnamed: 110_level_1,Unnamed: 111_level_1,Unnamed: 112_level_1,Unnamed: 113_level_1,Unnamed: 114_level_1,Unnamed: 115_level_1,Unnamed: 116_level_1,Unnamed: 117_level_1,Unnamed: 118_level_1,Unnamed: 119_level_1,Unnamed: 120_level_1,Unnamed: 121_level_1,Unnamed: 122_level_1,Unnamed: 123_level_1,Unnamed: 124_level_1,Unnamed: 125_level_1,Unnamed: 126_level_1,Unnamed: 127_level_1,Unnamed: 128_level_1,Unnamed: 129_level_1,Unnamed: 130_level_1,Unnamed: 131_level_1,Unnamed: 132_level_1,Unnamed: 133_level_1,Unnamed: 134_level_1,Unnamed: 135_level_1,Unnamed: 136_level_1,Unnamed: 137_level_1,Unnamed: 138_level_1,Unnamed: 139_level_1,Unnamed: 140_level_1,Unnamed: 141_level_1,Unnamed: 142_level_1,Unnamed: 143_level_1,Unnamed: 144_level_1,Unnamed: 145_level_1,Unnamed: 146_level_1,Unnamed: 147_level_1,Unnamed: 148_level_1,Unnamed: 149_level_1,Unnamed: 150_level_1,Unnamed: 151_level_1,Unnamed: 152_level_1,Unnamed: 153_level_1,Unnamed: 154_level_1,Unnamed: 155_level_1,Unnamed: 156_level_1,Unnamed: 157_level_1,Unnamed: 158_level_1,Unnamed: 159_level_1,Unnamed: 160_level_1,Unnamed: 161_level_1,Unnamed: 162_level_1,Unnamed: 163_level_1,Unnamed: 164_level_1,Unnamed: 165_level_1,Unnamed: 166_level_1,Unnamed: 167_level_1,Unnamed: 168_level_1,Unnamed: 169_level_1,Unnamed: 170_level_1,Unnamed: 171_level_1,Unnamed: 172_level_1,Unnamed: 173_level_1,Unnamed: 174_level_1,Unnamed: 175_level_1,Unnamed: 176_level_1
2987000,-1.577987,-0.278167,4,3417,500,42,1,38,1,166,65,-0.137532,31,31,-0.09802,-0.09226,-0.059438,-0.21606,-0.112869,-0.046146,-0.208712,-0.087363,-0.047034,-0.243806,-0.147247,-0.509782,-0.503333,-0.189393,-0.764989,-0.460267,-1.195934,-0.103737,-4.513538,-0.563826,-1.045689,-1.416108,-1.833103,-0.195921,-0.766342,1,1,1,2,0,1,2,2,2,0.010592,-0.175584,0.254143,-0.138091,-0.107737,-1.399366,0.890708,-0.540222,0.461255,-0.664176,0.061639,-0.193368,-0.50417,-0.168338,-0.142639,-0.809739,-0.366593,0.851647,-0.51961,-0.664404,0.913909,-0.234737,-0.521953,-0.508172,-1.7499,-0.208365,-0.694394,-0.328713,-0.051788,-0.291683,-0.193128,-0.925854,-0.085075,-1.348424,0.712571,2.676527,-0.910925,-0.280643,-1.102703,-1.135389,-0.963413,-0.639484,-0.074947,-0.080622,-0.121898,1.288134,1.113841,-0.069666,-0.417482,-0.155259,-0.470968,-0.910392,-0.063384,-0.051487,-0.865095,-0.430636,-1.072947,-0.46598,-0.091838,-0.097009,-0.110508,-0.009912,-0.004928,0.202858,-0.045803,-0.093392,-0.074128,0.045677,-0.02215,-0.13141,-0.093252,-0.105377,-0.261197,-0.936267,-0.047519,-0.043218,0.198889,0.006181,-0.394673,-0.040598,-0.454041,-0.066412,-0.334849,-0.227587,-0.230241,0.540805,-0.925067,5.187305,0.029746,-0.555474,0.369252,3.588854,0.106113,0.115225,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,-1.822224,-1.714835,5,-0.278668,-0.447183,16,24,7,4,51,16,24,8,13,293,7,68,0
2987001,-1.577986,-0.443327,4,7922,303,42,2,2,1,173,65,-0.102667,16,31,-0.09802,-0.09226,-0.059438,-0.21606,-0.112869,-0.046146,-0.268682,-0.097964,-0.047034,-0.243806,-0.147247,-0.598665,-0.503333,-0.210014,-0.764989,-0.460267,-1.195934,-0.103737,-4.513538,-0.638507,-1.093292,-1.416108,-1.833103,-0.195921,-0.766342,2,2,2,0,1,1,2,2,2,0.010592,-0.175584,0.254143,-0.138091,-0.107737,-1.399366,-0.977175,-0.540222,0.461255,-0.664176,-0.925159,-0.193368,-0.50417,-0.168338,-0.142639,-0.809739,-0.366593,-0.999398,-0.51961,-0.664404,-0.959375,-0.234737,-0.521953,-0.508172,0.498307,-0.208365,-0.694394,-0.328713,-0.079398,-0.291683,-0.193128,-0.925854,-0.085075,-1.348424,0.712571,2.676527,-0.910925,-0.280643,-1.102703,-1.135389,-0.963413,-0.639484,-0.074947,-0.080622,-0.121898,1.288134,1.113841,-0.069666,-0.417482,-0.155259,-0.470968,-0.910392,-0.063384,-0.051487,-0.865095,-0.430636,-1.072947,-0.46598,-0.091838,-0.097009,-0.110508,-0.009912,-0.004928,0.202858,-0.045803,-0.093392,-0.074128,0.045677,-0.02215,-0.13141,-0.093252,-0.105377,-0.261197,-0.936267,-0.047519,-0.043218,0.198889,0.006181,-0.394673,-0.040598,-0.454041,-0.093051,-0.334849,-0.227587,-0.230241,0.540805,-0.925067,5.187305,0.029746,-0.555474,0.369252,3.588854,0.106113,0.115225,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,-1.822224,-1.714835,5,-0.441734,-0.475884,12,15,2,10,30,16,24,8,13,293,7,68,0
2987002,-1.577972,-0.317889,4,9383,389,42,4,58,2,178,65,0.961748,36,31,-0.09802,-0.09226,-0.059438,-0.21606,-0.112869,-0.046146,-0.208712,-0.097964,-0.047034,-0.243806,-0.147247,-0.598665,-0.503333,-0.240946,-0.764989,-0.460267,-1.195934,-0.103737,-4.513538,-0.638507,1.165982,-1.416108,-1.833103,-0.195921,0.864292,1,1,1,0,0,0,0,0,0,0.010592,-0.175584,0.254143,-0.138091,-0.107737,-1.399366,0.890708,-0.540222,0.461255,-0.664176,1.048437,-0.193368,-0.50417,-0.168338,-0.142639,-0.809739,-0.366593,0.851647,-0.51961,-0.664404,0.913909,-0.234737,-0.521953,-0.508172,0.498307,-0.208365,-0.694394,-0.328713,-0.079398,-0.291683,-0.193128,-0.925854,-0.085075,-1.348424,0.712571,2.676527,-0.910925,-0.280643,-1.102703,-1.135389,-0.963413,-0.639484,-0.074947,-0.080622,-0.121898,1.288134,1.113841,-0.069666,-0.417482,-0.155259,-0.470968,-0.910392,-0.063384,-0.051487,-0.865095,-0.430636,-1.072947,-0.46598,-0.091838,-0.097009,-0.110508,-0.009912,-0.004928,0.202858,-0.045803,-0.093392,-0.074128,0.045677,-0.02215,-0.13141,-0.093252,-0.105377,-0.261197,-0.936267,-0.047519,-0.043218,0.198889,0.006181,-0.394673,-0.040598,-0.454041,-0.093051,-0.334849,-0.227587,-0.230241,0.540805,-0.925067,5.187305,0.029746,-0.555474,0.369252,3.588854,0.106113,0.115225,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,-1.822224,-1.656903,5,-0.316298,-0.475884,15,28,2,12,39,16,24,8,13,293,7,68,0
2987003,-1.577965,-0.355521,4,6991,466,42,2,14,2,282,65,0.065507,54,31,-0.090533,-0.066398,-0.059438,-0.21606,-0.070916,-0.046146,-0.208712,-0.097964,-0.047034,-0.058284,-0.147247,0.112393,-0.123779,-0.457466,-0.202238,-0.60071,-1.195934,0.391882,-4.513538,-0.15595,-0.998087,-1.416108,-1.833103,-0.195921,-0.191738,2,2,2,0,1,0,2,2,2,0.010592,-0.175584,0.254143,-0.138091,-0.107737,-1.399366,0.890708,-0.540222,0.461255,-0.664176,1.048437,-0.193368,-0.50417,-0.168338,-0.142639,-0.809739,-0.366593,0.851647,-0.51961,-0.664404,0.913909,-0.234737,-0.521953,-0.508172,0.498307,-0.208365,-0.694394,3.345226,0.335465,0.828993,0.644758,-0.925854,-0.085075,-1.348424,-0.027358,0.8263,1.445299,0.906446,-0.10519,0.854764,0.666399,0.88383,0.091329,0.264485,1.294943,1.288134,1.113841,-0.050992,-0.088065,-0.055352,-0.124329,-0.181534,0.011016,0.062627,1.368163,0.633307,0.815741,0.573303,-0.003175,1.05887,1.610972,-0.009912,-0.004928,0.202858,-0.045803,-0.093392,-0.074128,0.045677,-0.02215,0.004616,-0.038124,-0.02095,-0.071476,-0.171353,-0.047519,0.05374,-0.886776,-0.635981,-0.394673,-0.040598,-0.454041,0.307227,0.668043,0.55672,-0.230241,0.292792,0.121653,-0.09613,0.029746,-0.73258,0.30893,-0.07907,0.106113,0.115225,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,-1.822224,-1.656903,5,-0.353929,-0.475884,30,43,2,9,46,16,24,8,13,293,7,68,0
2987004,-1.577964,-0.355521,1,9262,413,42,2,2,1,241,65,0.446973,16,31,-0.09802,-0.09226,-0.059438,-0.21606,-0.112869,-0.046146,-0.268682,-0.097964,-0.047034,-0.243806,-0.147247,-0.598665,-0.449622,-0.034736,-0.764989,-0.326511,-1.009988,0.616784,-4.513538,-0.638507,0.012544,-1.217018,0.281952,-0.195921,0.048975,2,2,2,3,2,2,2,2,2,0.010592,-0.175584,0.254143,-0.138091,-0.107737,-1.399366,0.890708,-0.540222,0.461255,-0.664176,1.048437,-0.193368,-0.50417,-0.168338,-0.142639,-0.809739,-0.366593,0.851647,-0.51961,-0.664404,0.913909,-0.234737,-0.521953,-0.508172,0.498307,-0.208365,-0.694394,-0.328713,-0.079398,-0.291683,-0.193128,-0.925854,-0.085075,-1.348424,0.712571,2.676527,-0.910925,-0.280643,-1.102703,-1.135389,-0.963413,-0.639484,-0.074947,-0.080622,-0.121898,1.288134,1.113841,-0.069666,-0.417482,-0.155259,-0.470968,-0.910392,-0.063384,-0.051487,-0.865095,-0.430636,-1.072947,-0.46598,-0.091838,-0.097009,-0.110508,-0.009912,-0.004928,0.202858,-0.045803,-0.093392,-0.074128,0.045677,-0.02215,-0.13141,-0.093252,-0.105377,-0.261197,-0.936267,-0.047519,-0.043218,0.198889,0.006181,-0.394673,-0.040598,1.149541,-0.093051,-0.334849,-0.227587,-0.230241,0.788818,-1.045993,-0.09613,0.029746,-0.555474,0.610541,1.143572,0.106113,0.115225,1,54,1,1,59,400,32,1,1,7,164,1,0,1,2,954,-1.822224,-1.656903,5,-0.353929,-0.475884,12,15,2,12,41,16,24,8,7,249,0,58,0


In [12]:
test_data.head()

Unnamed: 0_level_0,TransactionDT,TransactionAmt,ProductCD,card1,card2,card3,card4,card5,card6,addr1,addr2,dist1,P_emaildomain,R_emaildomain,C1,C2,C4,C5,C6,C7,C9,C11,C12,C13,C14,D1,D2,D3,D4,D5,D6,D8,D9,D10,D11,D12,D13,D14,D15,M1,M2,M3,M4,M5,M6,M7,M8,M9,V1,V3,V4,V6,V8,V11,V13,V18,V20,V30,V36,V37,V40,V44,V47,V48,V52,V54,V60,V70,V76,V78,V80,V81,V82,V87,V91,V99,V127,V130,V131,V139,V147,V156,V165,V166,V169,V171,V173,V174,V175,V176,V180,V183,V185,V195,V198,V203,V205,V207,V209,V210,V215,V216,V220,V221,V223,V230,V234,V235,V238,V240,V241,V250,V252,V257,V258,V260,V262,V263,V264,V265,V268,V271,V274,V277,V282,V283,V289,V291,V303,V307,V310,V312,V315,id_01,id_02,id_03,id_04,id_05,id_06,id_09,id_10,id_11,id_12,id_13,id_15,id_16,id_17,id_19,id_20,id_28,id_29,id_30,id_33,id_35,id_36,id_37,DeviceType,DeviceInfo,TransactionHR,TransactionMT,TransactionDW,dollars,cents,card1_div_1000,card2_div_10,P_parent_domain,P_domain_name,P_top_level_domain,R_parent_domain,R_domain_name,R_top_level_domain,device_name,device_version,os_name,os_version
TransactionID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 100_level_1,Unnamed: 101_level_1,Unnamed: 102_level_1,Unnamed: 103_level_1,Unnamed: 104_level_1,Unnamed: 105_level_1,Unnamed: 106_level_1,Unnamed: 107_level_1,Unnamed: 108_level_1,Unnamed: 109_level_1,Unnamed: 110_level_1,Unnamed: 111_level_1,Unnamed: 112_level_1,Unnamed: 113_level_1,Unnamed: 114_level_1,Unnamed: 115_level_1,Unnamed: 116_level_1,Unnamed: 117_level_1,Unnamed: 118_level_1,Unnamed: 119_level_1,Unnamed: 120_level_1,Unnamed: 121_level_1,Unnamed: 122_level_1,Unnamed: 123_level_1,Unnamed: 124_level_1,Unnamed: 125_level_1,Unnamed: 126_level_1,Unnamed: 127_level_1,Unnamed: 128_level_1,Unnamed: 129_level_1,Unnamed: 130_level_1,Unnamed: 131_level_1,Unnamed: 132_level_1,Unnamed: 133_level_1,Unnamed: 134_level_1,Unnamed: 135_level_1,Unnamed: 136_level_1,Unnamed: 137_level_1,Unnamed: 138_level_1,Unnamed: 139_level_1,Unnamed: 140_level_1,Unnamed: 141_level_1,Unnamed: 142_level_1,Unnamed: 143_level_1,Unnamed: 144_level_1,Unnamed: 145_level_1,Unnamed: 146_level_1,Unnamed: 147_level_1,Unnamed: 148_level_1,Unnamed: 149_level_1,Unnamed: 150_level_1,Unnamed: 151_level_1,Unnamed: 152_level_1,Unnamed: 153_level_1,Unnamed: 154_level_1,Unnamed: 155_level_1,Unnamed: 156_level_1,Unnamed: 157_level_1,Unnamed: 158_level_1,Unnamed: 159_level_1,Unnamed: 160_level_1,Unnamed: 161_level_1,Unnamed: 162_level_1,Unnamed: 163_level_1,Unnamed: 164_level_1,Unnamed: 165_level_1,Unnamed: 166_level_1,Unnamed: 167_level_1,Unnamed: 168_level_1,Unnamed: 169_level_1,Unnamed: 170_level_1,Unnamed: 171_level_1,Unnamed: 172_level_1,Unnamed: 173_level_1,Unnamed: 174_level_1,Unnamed: 175_level_1
3663549,2.389081,-0.430993,4,365,10,42,4,108,2,52,65,-0.211364,16,31,-0.060586,-0.059933,-0.059438,-0.099722,-0.070916,-0.046146,0.091141,-0.055562,-0.035495,0.637423,-0.046327,2.061453,2.074766,0.0993,1.617725,-0.23957,2.172352,-0.207859,-4.513538,1.762789,0.345759,-1.416108,-1.833103,-0.195921,1.350894,1,1,0,3,2,0,1,1,1,0.010592,-0.175584,0.254143,-0.138091,-0.107737,0.717255,-0.977175,-0.540222,-1.62176,-0.664176,1.048437,-0.193368,-0.50417,-0.168338,-0.142639,0.829141,-0.366593,-0.999398,-0.51961,-0.664404,-0.959375,-0.234737,-0.521953,-0.508172,0.498307,-0.208365,1.128298,0.03868,-0.068083,-0.139885,-0.193128,-0.234535,-0.085075,-0.025678,-0.767286,-0.898062,-0.910925,-0.280643,-1.102703,-0.140312,-0.148507,-0.639484,-0.074947,-0.080622,-0.121898,1.288134,1.113841,-0.065172,-0.417482,-0.155259,-0.317466,-0.587631,-0.063384,-0.051487,-0.865095,-0.430636,-1.072947,-0.46598,-0.091838,-0.097009,-0.110508,-0.009912,-0.004928,0.202858,-0.045803,-0.093392,-0.074128,0.045677,-0.02215,-0.13141,-0.093252,-0.105377,-0.261197,-0.936267,-0.047519,-0.043218,-0.886776,-0.635981,-0.394673,-0.040598,-0.454041,-0.082133,-0.199006,-0.227587,-0.230241,-1.443297,-0.434898,-0.09613,0.029746,-0.73258,0.670863,-0.07907,0.106113,0.115225,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,-1.822224,-1.714835,0,-0.433372,0.069444,1,1,12,15,2,16,24,8,13,293,7,68
3663550,2.38909,-0.359702,4,9099,10,42,4,108,2,151,65,-0.199059,2,31,-0.083047,-0.085795,-0.059438,-0.21606,-0.112869,-0.046146,-0.148741,-0.097964,-0.035495,-0.158775,-0.127063,0.347296,0.141192,-0.313119,3.030591,-0.507081,2.172352,-0.207859,-4.513538,0.688525,3.502151,1.809139,-1.833103,-0.195921,2.515632,1,0,0,0,2,0,2,2,2,0.010592,-0.175584,0.254143,-0.138091,-0.107737,-1.399366,0.890708,-0.540222,0.461255,-0.664176,1.048437,-0.193368,-0.50417,-0.168338,-0.142639,-0.809739,-0.366593,-0.999398,-0.51961,-0.664404,0.913909,-0.234737,-0.521953,-0.508172,0.498307,-0.208365,-0.694394,1.140862,-0.013322,0.594728,0.284777,-0.234535,-0.085075,-0.025678,-0.767286,-0.898062,-0.910925,-0.280643,-1.102703,-0.140312,-0.148507,-0.639484,-0.074947,-0.080622,-0.121898,1.288134,1.113841,-0.065172,-0.417482,-0.155259,-0.317466,-0.587631,-0.063384,-0.051487,-0.865095,-0.430636,-1.072947,-0.46598,-0.091838,-0.097009,-0.110508,-0.009912,-0.004928,0.202858,-0.045803,-0.093392,-0.074128,0.045677,-0.02215,-0.13141,-0.093252,-0.105377,-0.261197,-0.936267,-0.047519,-0.043218,-0.886776,-0.635981,-0.394673,-0.040598,-0.454041,-0.029298,0.458398,0.219758,-0.230241,-1.443297,-0.434898,-0.09613,0.029746,-0.73258,0.670863,-0.07907,0.106113,0.115225,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,-1.822224,-1.656903,0,-0.35811,-0.475884,12,1,2,2,2,16,24,8,13,293,7,68
3663551,2.3891,0.150412,4,9245,473,42,4,108,2,280,65,10.592751,19,31,-0.090533,-0.085795,-0.059438,-0.21606,-0.056932,-0.046146,-0.0288,-0.087363,-0.047034,-0.081474,-0.127063,0.271111,0.055255,-0.251256,-0.184277,-0.466954,2.172352,-0.207859,-4.513538,0.142776,-0.144909,-1.416108,-1.833103,-0.195921,-0.264211,1,1,0,0,0,0,0,0,0,0.010592,-0.175584,0.254143,-0.138091,-0.107737,-1.399366,0.890708,-0.540222,0.461255,-0.664176,1.048437,-0.193368,-0.50417,-0.168338,-0.142639,-0.809739,-0.366593,-0.999398,-0.51961,-0.664404,2.787192,1.135703,-0.521953,-0.508172,0.498307,-0.208365,-0.694394,0.773468,0.149036,1.940173,-0.193128,1.148103,-0.085075,-0.025678,-0.752933,-0.898062,-0.910925,-0.280643,-1.102703,-0.140312,-0.148507,-0.639484,-0.074947,-0.080622,-0.121898,1.288134,1.113841,-0.065172,-0.417482,-0.155259,-0.317466,-0.587631,-0.063384,-0.051487,-0.865095,-0.430636,-1.072947,-0.46598,-0.091838,-0.097009,-0.110508,-0.009912,-0.004928,0.202858,-0.045803,-0.093392,-0.074128,0.045677,-0.02215,-0.13141,-0.093252,-0.105377,-0.261197,-0.936267,-0.047519,-0.043218,-0.886776,-0.635981,-0.394673,0.020931,-0.454041,0.207727,2.662494,-0.227587,-0.230241,-1.443297,-0.434898,-0.09613,0.029746,-0.73258,0.670863,-0.07907,0.106113,0.115225,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,-1.822224,-1.656903,0,0.151996,-0.475884,12,47,15,17,2,16,24,8,13,293,7,68
3663552,2.3891,0.626866,4,870,259,42,4,58,2,79,65,-0.145736,16,31,-0.068073,-0.085795,-0.059438,-0.177281,-0.112869,-0.046146,-0.148741,-0.087363,-0.047034,-0.197426,-0.086695,-0.332018,-0.625076,0.387993,0.683797,-0.052312,-1.195934,-0.207859,-4.513538,0.751717,0.631372,-1.416108,-1.833103,-0.195921,0.486399,1,1,1,3,2,1,2,2,2,0.010592,-0.175584,0.254143,-0.138091,-0.107737,0.717255,0.890708,-0.540222,0.461255,1.202141,3.022033,1.475963,-0.50417,1.643501,4.914353,0.829141,-0.366593,0.851647,-0.51961,1.204801,0.913909,-0.234737,-0.521953,-0.508172,0.498307,-0.208365,1.128298,-0.328713,-0.079398,-0.291683,-0.193128,-0.234535,-0.085075,-0.025678,-0.767286,-0.898062,-0.910925,-0.280643,-1.102703,-1.135389,-0.963413,-0.639484,-0.074947,-0.080622,-0.121898,1.288134,1.113841,-0.069666,-0.417482,-0.155259,-0.470968,-0.910392,-0.063384,-0.051487,-0.865095,-0.430636,-1.072947,-0.46598,-0.091838,-0.097009,-0.110508,-0.009912,-0.004928,0.202858,-0.045803,-0.093392,-0.074128,0.045677,-0.02215,-0.13141,-0.093252,-0.105377,-0.261197,-0.936267,-0.047519,-0.043218,0.198889,0.006181,1.275505,-0.040598,-0.454041,-0.093051,-0.334849,-0.227587,2.189691,-1.69131,0.345129,-0.09613,0.029746,-0.555474,0.670863,-0.07907,0.106113,0.115225,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,-1.822224,-1.656903,0,0.624472,0.069444,1,26,12,15,2,16,24,8,13,293,7,68
3663553,2.389101,-0.280467,4,6894,351,42,2,14,2,127,65,-0.190855,16,31,-0.060586,-0.059933,-0.059438,-0.138501,-0.056932,-0.046146,0.03117,-0.044962,-0.047034,-0.143315,-0.046327,-0.458993,-0.768304,-0.457466,-0.633281,-0.60071,-1.195934,-0.207859,-4.513538,-0.512123,-0.979779,-1.416108,-1.833103,-0.195921,-0.652457,1,1,1,3,2,0,0,1,1,0.010592,-0.175584,0.254143,-0.138091,-0.107737,0.717255,0.890708,-0.540222,0.461255,1.202141,1.048437,-0.193368,-0.50417,-0.168338,-0.142639,0.829141,-0.366593,0.851647,-0.51961,1.204801,0.913909,-0.234737,-0.521953,-0.508172,0.498307,-0.208365,1.128298,0.773468,-0.036012,0.29034,0.228608,-0.234535,-0.085075,-0.025678,-0.767286,-0.898062,-0.910925,-0.280643,-1.102703,-1.135389,-0.963413,-0.639484,-0.074947,-0.080622,-0.121898,1.288134,1.113841,-0.069666,-0.417482,-0.155259,-0.470968,-0.910392,-0.063384,-0.051487,-0.865095,-0.430636,-1.072947,-0.46598,-0.091838,-0.097009,-0.110508,-0.009912,-0.004928,0.202858,-0.045803,-0.093392,-0.074128,0.045677,-0.02215,-0.13141,-0.093252,-0.105377,-0.261197,-0.936267,-0.047519,-0.043218,0.198889,0.006181,1.275505,-0.040598,-0.454041,-0.05119,0.186003,0.167181,0.351745,-1.69131,0.345129,-0.09613,0.029746,-0.555474,0.670863,-0.07907,0.106113,0.115225,2,54,3,2,104,522,394,2,2,74,260,2,2,2,1,1735,-1.822224,-1.656903,0,-0.282849,0.069444,9,35,12,15,2,16,24,8,13,293,7,68


In [13]:
train_data.to_pickle('train_knn_scaled.pkl')
test_data.to_pickle('test_knn_scaled.pkl')